7da6eb2dd83b34a5400e24bcda9d1894f7874213
[nit.git] / lib / standard / collection / hash_collection.nit
1 # This file is part of NIT ( http://www.nitlanguage.org ).
2 #
3 # Copyright 2004-2009 Jean Privat <jean@pryen.org>
4 #
5 # This file is free software, which comes along with NIT. This software is
6 # distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
7 # without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
8 # PARTICULAR PURPOSE. You can modify it is you want, provided this header
9 # is kept unaltered, and a notification of the changes is added.
10 # You are allowed to redistribute it and sell it, alone or is a part of
11 # another product.
12
13 # Introduce Hashmap and Hashset.
14 module hash_collection
15
16 import array
17
18 # A HashCollection is an array of HashNode[K] indexed by the K hash value
private abstract class HashCollection[K: Object, N: HashNode[Object]]
	super ArrayCapable[nullable N]

	var _array: nullable NativeArray[nullable N] = null # Used to store items (each cell is the head of a bucket chain)
	var _capacity: Int = 0 # Size of _array
	var _length: Int = 0 # Number of items in the map

	readable var _first_item: nullable N = null # First added item (used to visit items in nice order)
	var _last_item: nullable N = null # Last added item (same)

	# The last key accessed (used for cache)
	var _last_accessed_key: nullable K = null

	# The last node accessed (used for cache)
	var _last_accessed_node: nullable N = null

	# Return the index of the key k
	# The index is `k.hash` modulo `_capacity`, negated when negative.
	fun index_at(k: K): Int
	do
		var i = k.hash % _capacity
		if i < 0 then i = - i
		return i
	end

	# Return the node associated with the key (null if there is none)
	# The result, even a null one, is remembered in the one-entry cache.
	fun node_at(k: K): nullable N
	do
		# cache: `is` is used instead of `==` because it is a faster filter (even if not exact)
		if k is _last_accessed_key then return _last_accessed_node

		var res = node_at_idx(index_at(k), k)
		_last_accessed_key = k
		_last_accessed_node = res
		return res
	end

	# Return the node associated with the key (but with the index already known)
	# Walks the chain of the bucket `i`; returns null when no key matches.
	fun node_at_idx(i: Int, k: K): nullable N
	do
		var c = _array[i]
		while c != null do
			var ck = c._key
			if ck is k or ck == k then # prefilter with `is` because the compiler is not smart enough yet
				break
			end
			c = c._next_in_bucklet
		end
		return c
	end

	# Add a new node at a given index
	# The node is appended to the insertion-order list and becomes the head
	# of the bucket `index`. The caller must have checked that the key is absent.
	fun store(index: Int, node: N)
	do
		# Store the item in the list
		if _first_item == null then
			_first_item = node
		else
			_last_item._next_item = node
		end
		node._prev_item = _last_item
		node._next_item = null
		_last_item = node

		# Then store it in the array
		var next = _array[index]
		_array[index] = node
		node._next_in_bucklet = next
		if next != null then next._prev_in_bucklet = node

		_last_accessed_key = node._key
		_last_accessed_node = node

		# Enlarge if needed
		var l = _length
		_length = l + 1
		l = (l + 5) * 3 / 2
		if l >= _capacity then
			enlarge(l * 2)
		end
	end

	# Remove the node associated with the key
	# Does nothing when the key is absent.
	fun remove_node(k: K)
	do
		var i = index_at(k)
		var node = node_at_idx(i, k)
		if node == null then return

		# Remove the item in the list
		var prev = node._prev_item
		var next = node._next_item
		if prev != null then
			prev._next_item = next
		else
			_first_item = next
		end
		if next != null then
			next._prev_item = prev
		else
			_last_item = prev
		end

		# Remove the item in the array
		_length -= 1
		prev = node._prev_in_bucklet
		next = node._next_in_bucklet
		if prev != null then
			prev._next_in_bucklet = next
		else
			# No predecessor: the node is the head of its bucket
			_array[i] = next
		end
		if next != null then
			next._prev_in_bucklet = prev
		end

		# Invalidate the cache since it may designate the removed node
		_last_accessed_key = null
	end

	# Clear the whole structure
	# The capacity is kept; only the content is dropped.
	fun raz
	do
		var i = _capacity - 1
		while i >= 0 do
			_array[i] = null
			i -= 1
		end
		_length = 0
		_first_item = null
		_last_item = null
		_last_accessed_key = null
	end

	# Force a capacity
	# A request below `_length + 1` is raised to that value.
	# A request that does not exceed the current capacity is ignored.
	fun enlarge(cap: Int)
	do
		# get a new capacity
		if cap < _length + 1 then cap = _length + 1
		if cap <= _capacity then return
		_capacity = cap
		_last_accessed_key = null

		# get a new array
		var new_array = calloc_array(cap)
		_array = new_array

		# clean the new array
		var i = cap - 1
		while i >= 0 do
			new_array[i] = null
			i -= 1
		end

		# Reput items in the array
		var node = _first_item
		while node != null do
			var index = index_at(node._key)
			# Then store it in the array
			var next = new_array[index]
			new_array[index] = node
			# The node becomes the head of its new bucket, so the predecessor
			# it had in the old array must be forgotten. Otherwise `remove_node`
			# would follow the stale link, skip the update of `_array`, and
			# leave the removed node reachable.
			node._prev_in_bucklet = null
			node._next_in_bucklet = next
			if next != null then next._prev_in_bucklet = node
			node = node._next_item
		end
	end
end
187
private abstract class HashNode[K: Object]
	# Concrete type of the nodes linked to this one (refined by subclasses)
	type N: HashNode[K]

	# The key stored in the node
	var _key: K

	# Neighbours in the list that chains all the nodes of a collection
	readable writable var _next_item: nullable N = null
	readable writable var _prev_item: nullable N = null

	# Neighbours in the chain of the bucket that holds the node
	var _prev_in_bucklet: nullable N = null
	var _next_in_bucklet: nullable N = null

	# Create an unlinked node for the key `k`
	init(k: K) do _key = k
end
200
201 # A map implemented with a hash table.
202 # Keys of such a map cannot be null and require a working `hash` method
class HashMap[K: Object, V]
	super Map[K, V]
	super HashCollection[K, HashMapNode[K, V]]

	# Start with an empty table
	init
	do
		_length = 0
		_capacity = 0
		enlarge(0)
	end

	# View on the keys of the map
	redef var keys: HashMapKeys[K, V] = new HashMapKeys[K, V](self)

	# View on the values of the map
	redef var values: HashMapValues[K, V] = new HashMapValues[K, V](self)

	# Number of associations
	redef fun length do return _length

	# Is there no association at all?
	redef fun is_empty do return _length == 0

	# The value associated with `key`; aborts if `key` is absent
	redef fun [](key)
	do
		var node = node_at(key)
		if node != null then
			return node._value
		else
			abort
		end
	end

	# Associate `v` with `key`, replacing the previous association if any
	redef fun []=(key, v)
	do
		var idx = index_at(key)
		var node = node_at_idx(idx, key)
		if node == null then
			# Unknown key: a new node is needed
			store(idx, new HashMapNode[K, V](key, v))
		else
			# Known key: the existing node is reused
			node._key = key
			node._value = v
		end
	end

	# Drop all the associations
	redef fun clear do raz

	# A new iterator starting on the first item of the map
	redef fun iterator: HashMapIterator[K, V]
	do
		return new HashMapIterator[K,V](self)
	end

	# Call `each` on every association, starting from `_first_item`
	redef fun iterate
		!each(k: K, v: V)
	do
		var node = _first_item
		while node != null do
			each(node._key, node._value)
			node = node._next_item
		end
	end
end
257
258 # View of the keys of a HashMap
class HashMapKeys[K: Object, V]
	super RemovableCollection[K]

	# The original map
	var map: HashMap[K, V]

	# Number of keys (same as the length of the map)
	redef fun length do return self.map.length

	# Is the map empty?
	redef fun is_empty do return self.map.is_empty

	# Key of the first item of the map
	redef fun first do return self.map._first_item._key

	# Is `k` a key of the map?
	redef fun has(k)
	do
		var node = self.map.node_at(k)
		return node != null
	end

	# A key is present at most once, so the answer is 1 or 0
	redef fun count(k)
	do
		if self.has(k) then return 1
		return 0
	end

	# True if `k` is the only key, or if there is no key at all
	redef fun has_only(k)
	do
		if self.has(k) and self.length == 1 then return true
		return self.is_empty
	end

	# Iterate on the keys through the iterator of the map
	redef fun iterator
	do
		return new MapKeysIterator[K, V](self.map.iterator)
	end

	# Empty the original map
	redef fun clear do self.map.clear

	# Remove the association of `key` from the original map
	redef fun remove(key) do self.map.remove_node(key)

	# Same as `remove`
	redef fun remove_all(key) do self.map.remove_node(key)
end
278
279 # View of the values of a Map
class HashMapValues[K: Object, V]
	super RemovableCollection[V]

	# The original map
	var map: HashMap[K, V]

	# Number of values (same as the length of the map)
	redef fun length do return self.map.length

	# Is the map empty?
	redef fun is_empty do return self.map.is_empty

	# Value of the first item of the map
	redef fun first do return self.map._first_item._value

	# Number of items whose value is equal to `item`
	redef fun count(item)
	do
		var total = 0
		var node = self.map._first_item
		while node != null do
			if node._value == item then total += 1
			node = node._next_item
		end
		return total
	end

	# Is there at least one item whose value is equal to `item`?
	redef fun has(item)
	do
		var node = self.map._first_item
		while node != null do
			if node._value == item then return true
			node = node._next_item
		end
		return false
	end

	# Are all the values equal to `item`? (true when there is no value)
	redef fun has_only(item)
	do
		var node = self.map._first_item
		while node != null do
			if node._value != item then return false
			node = node._next_item
		end
		return true
	end

	# Iterate on the values through the iterator of the map
	redef fun iterator
	do
		return new MapValuesIterator[K, V](self.map.iterator)
	end

	# Empty the original map
	redef fun clear do self.map.clear

	# Remove the first item whose value is equal to `item`
	redef fun remove(item)
	do
		var owner = self.map
		var node = owner._first_item
		while node != null do
			if node._value == item then
				owner.remove_node(node._key)
				return
			end
			node = node._next_item
		end
	end

	# Remove every item whose value is equal to `item`
	redef fun remove_all(item)
	do
		var owner = self.map
		var node = owner._first_item
		while node != null do
			if node._value == item then
				owner.remove_node(node._key)
			end
			# `remove_node` leaves `_next_item` of the removed node untouched,
			# so the walk can continue from it
			node = node._next_item
		end
	end
end
349
private class HashMapNode[K: Object, V]
	super HashNode[K]

	# Nodes of a map are only linked to other nodes of a map
	redef type N: HashMapNode[K, V]

	# The value associated with the key of the node
	var _value: V

	# Create an unlinked node that associates `v` with `k`
	init(k: K, v: V)
	do
		super(k)
		_value = v
	end
end
361
class HashMapIterator[K: Object, V]
	super MapIterator[K, V]

	# The map to iterate on
	var _map: HashMap[K, V]

	# The current node
	var _node: nullable HashMapNode[K, V]

	# Start the iteration on the first item of `map`
	init(map: HashMap[K, V])
	do
		_node = map.first_item
		_map = map
	end

	# Is there a current node?
	redef fun is_ok
	do
		return _node != null
	end

	# Key of the current node
	redef fun key
	do
		assert is_ok
		return _node._key
	end

	# Value of the current node
	redef fun item
	do
		assert is_ok
		return _node._value
	end

	#redef fun item=(value)
	#do
	#	assert is_ok
	#	_node.second = value
	#end

	# Move to the node that follows the current one
	redef fun next
	do
		assert is_ok
		_node = _node._next_item
	end
end
402
# A `Set` implemented with a hash table.
# Items of such a set cannot be null and require a working `hash` method
class HashSet[E: Object]
	super Set[E]
	super HashCollection[E, HashSetNode[E]]

	# Start with an empty table
	init
	do
		_length = 0
		_capacity = 0
		enlarge(0)
	end

	# Build a set filled with the items of `coll`.
	init from(coll: Collection[E]) do
		init
		add_all(coll)
	end

	# Number of items
	redef fun length do return _length

	# Is there no item at all?
	redef fun is_empty do return _length == 0

	# The first added item still in the set; the set must not be empty
	redef fun first
	do
		assert _length > 0
		return _first_item._key
	end

	# Is `item` in the set?
	redef fun has(item)
	do
		var node = node_at(item)
		return node != null
	end

	# Add `item`; an equal item already in the set is replaced by `item`
	redef fun add(item)
	do
		var idx = index_at(item)
		var node = node_at_idx(idx, item)
		if node == null then
			store(idx,new HashSetNode[E](item))
		else
			node._key = item
		end
	end

	# Remove `item` (nothing happens if it is absent)
	redef fun remove(item) do remove_node(item)

	# Drop all the items
	redef fun clear do raz

	# A new iterator starting on the first item of the set
	redef fun iterator
	do
		return new HashSetIterator[E](self)
	end
end
454
private class HashSetNode[E: Object]
	super HashNode[E]

	# Nodes of a set are only linked to other nodes of a set
	redef type N: HashSetNode[E]

	# Create an unlinked node for the item `e`
	init(e: E)
	do
		# The inherited constructor stores `e` as the key of the node
		super(e)
	end
end
464
class HashSetIterator[E: Object]
	super Iterator[E]

	# The set to iterate on
	var _set: HashSet[E]

	# The position in the internal map storage
	var _node: nullable HashSetNode[E]

	# Start the iteration on the first item of `set`
	init(set: HashSet[E])
	do
		_node = set._first_item
		_set = set
	end

	# Is there a current node?
	redef fun is_ok
	do
		return _node != null
	end

	# Item held by the current node
	redef fun item
	do
		assert is_ok
		return _node._key
	end

	# Move to the node that follows the current one
	redef fun next
	do
		assert is_ok
		_node = _node._next_item
	end
end
493