Trie data structure for prefix searches

var trie = new Trie[Int]
trie["foo"] = 1
trie["fooo"] = 2
trie["bar"] = 3

# Search by key
assert trie.has_key("foo")
assert trie["foo"] == 1

# Search by prefix
assert trie.find_by_prefix("") == [1, 3, 2]
assert trie.find_by_prefix("foo") == [1, 2]
assert trie.find_by_prefix("baz").is_empty

Introduced properties

private var _cache: nullable TrieNode[E]

trees :: Trie :: _cache

Cache node used between has_key and []
private var _cache_key: nullable String

trees :: Trie :: _cache_key

Cache key used between has_key and []
private var _root: TrieNode[E]

trees :: Trie :: _root

Trie root
private fun cache: nullable TrieNode[E]

trees :: Trie :: cache

Cache node used between has_key and []
private fun cache=(cache: nullable TrieNode[E])

trees :: Trie :: cache=

Cache node used between has_key and []
private fun cache_key: nullable String

trees :: Trie :: cache_key

Cache key used between has_key and []
private fun cache_key=(cache_key: nullable String)

trees :: Trie :: cache_key=

Cache key used between has_key and []
fun find_by_prefix(prefix: String): Array[E]

trees :: Trie :: find_by_prefix

Find values stored under prefix
fun has_prefix(prefix: String): Bool

trees :: Trie :: has_prefix

Find values stored under prefix
private fun root: TrieNode[E]

trees :: Trie :: root

Trie root
private fun root=(root: TrieNode[E])

trees :: Trie :: root=

Trie root
private fun search_node(string: nullable Object): nullable TrieNode[E]

trees :: Trie :: search_node

Search a node by a key or prefix

Redefined properties

redef type SELF: Trie[E]

trees $ Trie :: SELF

Type of this instance, automatically specialized in every class
redef fun [](key: nullable Object): E

trees $ Trie :: []

Get the item at key
redef fun []=(key: String, value: E)

trees $ Trie :: []=

Set the value at key.
redef fun has_key(key: nullable Object): Bool

trees $ Trie :: has_key

Is there an item associated with key?

All properties

fun !=(other: nullable Object): Bool

core :: Object :: !=

Have self and other different values?
fun ==(other: nullable Object): Bool

core :: Object :: ==

Have self and other the same value?
type CLASS: Class[SELF]

core :: Object :: CLASS

The type of the class of self.
type SELF: Object

core :: Object :: SELF

Type of this instance, automatically specialized in every class
abstract fun [](key: nullable Object): V

core :: MapRead :: []

Get the item at key
abstract fun []=(key: K, value: V)

core :: Map :: []=

Set the value at key.
private var _cache: nullable TrieNode[E]

trees :: Trie :: _cache

Cache node used between has_key and []
private var _cache_key: nullable String

trees :: Trie :: _cache_key

Cache key used between has_key and []
private var _root: TrieNode[E]

trees :: Trie :: _root

Trie root
protected fun accept_json_serializer(v: JsonSerializer)

serialization :: Serializable :: accept_json_serializer

Refinable service to customize the serialization of this class to JSON
protected fun accept_msgpack_attribute_counter(v: AttributeCounter)

serialization :: Serializable :: accept_msgpack_attribute_counter

Hook to customize the behavior of the AttributeCounter
protected fun accept_msgpack_serializer(v: MsgPackSerializer)

serialization :: Serializable :: accept_msgpack_serializer

Hook to customize the serialization of this class to MessagePack
fun add_all(map: MapRead[K, V])

core :: Map :: add_all

Add each (key,value) of map into self.
protected fun add_to_bundle(bundle: NativeBundle, key: JavaString)

serialization :: Serializable :: add_to_bundle

Called by []= to dynamically choose the appropriate method according
private fun cache: nullable TrieNode[E]

trees :: Trie :: cache

Cache node used between has_key and []
private fun cache=(cache: nullable TrieNode[E])

trees :: Trie :: cache=

Cache node used between has_key and []
private fun cache_key: nullable String

trees :: Trie :: cache_key

Cache key used between has_key and []
private fun cache_key=(cache_key: nullable String)

trees :: Trie :: cache_key=

Cache key used between has_key and []
protected fun class_factory(name: String): CLASS

core :: Object :: class_factory

Implementation used by get_class to create the specific class.
fun class_name: String

core :: Object :: class_name

The class name of the object.
abstract fun clear

core :: Map :: clear

Remove all items
fun core_serialize_to(serializer: Serializer)

serialization :: Serializable :: core_serialize_to

Actual serialization of self to serializer
fun filter_keys(keys: Collection[nullable Object]): Array[K]

core :: MapRead :: filter_keys

Return all elements of keys that have a value.
fun find_by_prefix(prefix: String): Array[E]

trees :: Trie :: find_by_prefix

Find values stored under prefix
init from_deserializer(deserializer: Deserializer)

serialization :: Serializable :: from_deserializer

Create an instance of this class from the deserializer
fun get_class: CLASS

core :: Object :: get_class

The meta-object representing the dynamic type of self.
fun get_or_default(key: nullable Object, default: V): V

core :: MapRead :: get_or_default

Get the item at key or return default if not in map
fun get_or_null(key: nullable Object): nullable V

core :: MapRead :: get_or_null

Get the item at key or null if key is not in the map.
fun has_key(key: nullable Object): Bool

core :: MapRead :: has_key

Is there an item associated with key?
fun has_prefix(prefix: String): Bool

trees :: Trie :: has_prefix

Find values stored under prefix
fun hash: Int

core :: Object :: hash

The hash code of the object.
init init

core :: Object :: init

fun inspect: String

core :: Object :: inspect

Developer readable representation of self.
protected fun inspect_head: String

core :: Object :: inspect_head

Return "CLASSNAME:#OBJECTID".
abstract fun is_empty: Bool

core :: MapRead :: is_empty

Is there no item in the collection?
intern fun is_same_instance(other: nullable Object): Bool

core :: Object :: is_same_instance

Return true if self and other are the same instance (i.e. same identity).
fun is_same_serialized(other: nullable Object): Bool

core :: Object :: is_same_serialized

Is self the same as other in a serialization context?
intern fun is_same_type(other: Object): Bool

core :: Object :: is_same_type

Return true if self and other have the same dynamic type.
abstract fun iterator: MapIterator[K, V]

core :: MapRead :: iterator

Get a new iterator on the map.
abstract fun join(sep: String, couple_sep: String): String

core :: Map :: join

Concatenate couples of key value.
abstract fun keys: Collection[K]

core :: MapRead :: keys

Return the point of view of self on the keys only.
fun keys_sorted_by_values(comparator: Comparator): Array[K]

core :: MapRead :: keys_sorted_by_values

Return an array of all keys sorted with their values using comparator.
abstract fun length: Int

core :: MapRead :: length

Number of items in the collection.
fun lookup_all_values(pe: POSetElement[K]): Set[V]

core :: MapRead :: lookup_all_values

Search all the values in pe.greaters.
fun lookup_values(pe: POSetElement[K]): Set[V]

core :: MapRead :: lookup_values

Combine the values in pe.greaters from the most smaller elements that have a value.
protected fun msgpack_extra_array_items: Int

serialization :: Serializable :: msgpack_extra_array_items

Hook to request a larger than usual metadata array
private intern fun native_class_name: CString

core :: Object :: native_class_name

The class name of the object in CString format.
init new: Map[K, V]

core :: Map :: new

Get a HashMap[K, V] as default implementation
fun not_empty: Bool

core :: MapRead :: not_empty

Alias for not is_empty.
intern fun object_id: Int

core :: Object :: object_id

An internal hash code for the object based on its identity.
fun output

core :: Object :: output

Display self on stdout (debug only).
intern fun output_class_name

core :: Object :: output_class_name

Display class name on stdout (debug only).
protected fun provide_default_value(key: nullable Object): V

core :: MapRead :: provide_default_value

Called by the underling implementation of [] to provide a default value when a key has no value
fun recover_with(map: MapRead[K, V])

core :: Map :: recover_with

Alias for add_all
private fun root: TrieNode[E]

trees :: Trie :: root

Trie root
private fun root=(root: TrieNode[E])

trees :: Trie :: root=

Trie root
private fun search_node(string: nullable Object): nullable TrieNode[E]

trees :: Trie :: search_node

Search a node by a key or prefix
fun serialization_hash: Int

core :: Object :: serialization_hash

Hash value use for serialization
fun serialize_msgpack(plain: nullable Bool): Bytes

serialization :: Serializable :: serialize_msgpack

Serialize self to MessagePack bytes
fun serialize_to(serializer: Serializer)

serialization :: Serializable :: serialize_to

Serialize self to serializer
fun serialize_to_json(plain: nullable Bool, pretty: nullable Bool): String

serialization :: Serializable :: serialize_to_json

Serialize self to JSON
private fun serialize_to_or_delay(v: Serializer)

serialization :: Serializable :: serialize_to_or_delay

Accept references or force direct serialization (using serialize_to)
intern fun sys: Sys

core :: Object :: sys

Return the global sys object, the only instance of the Sys class.
fun to_json: String

serialization :: Serializable :: to_json

Serialize self to plain JSON
abstract fun to_jvalue(env: JniEnv): JValue

core :: Object :: to_jvalue

fun to_map_comparator(comparator: Comparator): MapComparator[K, V]

core :: MapRead :: to_map_comparator

A comparator that compares things with their values in self.
fun to_pretty_json: String

serialization :: Serializable :: to_pretty_json

Serialize self to plain pretty JSON
fun to_s: String

core :: Object :: to_s

User readable representation of self.
abstract fun values: Collection[V]

core :: MapRead :: values

Return the point of view of self on the values only.
fun values_sorted_by_key(comparator: Comparator): Array[V]

core :: MapRead :: values_sorted_by_key

Return an array of all values sorted with their keys using comparator.
package_diagram trees::Trie Trie core::Map Map trees::Trie->core::Map serialization::Serializable Serializable core::Map->serialization::Serializable core::MapRead MapRead core::Map->core::MapRead ...serialization::Serializable ... ...serialization::Serializable->serialization::Serializable ...core::MapRead ... ...core::MapRead->core::MapRead

Ancestors

interface MapRead[K: nullable Object, V: nullable Object]

core :: MapRead

MapRead are abstract associative collections: key -> item.
interface Object

core :: Object

The root of the class hierarchy.
interface Serializable

serialization :: Serializable

Instances of this class can be passed to Serializer::serialize

Parents

interface Map[K: nullable Object, V: nullable Object]

core :: Map

Maps are associative collections: key -> item.

Class definitions

trees $ Trie
# Trie data structure for prefix searches
#
# ~~~
# # Associate some integers to Map keys
# var trie = new Trie[Int]
# trie["foo"] = 1
# trie["fooo"] = 2
# trie["bar"] = 3
#
# # Search by key
# assert trie.has_key("foo")
# assert trie["foo"] == 1
#
# # Search by prefix
# assert trie.find_by_prefix("") == [1, 3, 2]
# assert trie.find_by_prefix("foo") == [1, 2]
# assert trie.find_by_prefix("baz").is_empty
# ~~~
class Trie[E]
	super Map[String, E]

	# Trie root
	#
	# Root children are used to store the first letters.
	private var root = new TrieNode[E]

	redef fun []=(key, value) do
		var children = root.children

		for i in [0..key.length[ do
			var c = key.chars[i]

			var node
			if children.has_key(c) then
				node = children[c]
			else
				node = new TrieNode[E](c)
				children[c] = node
			end
			children = node.children

			if i == key.length - 1 then
				node.is_leaf = true
				node.value = value
			end
		end
	end

	# Cache node used between `has_key` and `[]`
	private var cache: nullable TrieNode[E] = null

	# Cache key used between `has_key` and `[]`
	private var cache_key: nullable String = null

	redef fun [](key) do
		if cache_key == key then return cache.as(not null).value.as(not null)
		var node = search_node(key)
		assert node != null
		return node.value
	end

	redef fun has_key(key) do
		var node = search_node(key)
		if node == null then return false
		var res = node.is_leaf
		if res then
			cache = node
			cache_key = key.as(String)
		end
		return res
	end

	# Find values stored under `prefix`
	#
	# ~~~
	# # Associate some integers to Map keys
	# var trie = new Trie[Int]
	# trie["foo"] = 1
	# trie["fooo"] = 2
	# trie["foooo"] = 3
	# trie["bar"] = 4
	#
	# assert trie.find_by_prefix("") == [1, 4, 2, 3]
	# assert trie.find_by_prefix("foo") == [1, 2, 3]
	# assert trie.find_by_prefix("bar") == [4]
	# assert trie.find_by_prefix("baz").is_empty
	# ~~~
	fun find_by_prefix(prefix: String): Array[E] do
		var node
		if prefix == "" then
			node = root
		else
			node = search_node(prefix)
		end
		if node == null then return new Array[E]
		return node.collect_values
	end

	# Find values stored under `prefix`
	#
	# ~~~
	# # Associate some integers to Map keys
	# var trie = new Trie[Int]
	# trie["foo"] = 1
	# trie["bar"] = 4
	# trie["baz"] = 5
	#
	# assert trie.has_prefix("")
	# assert trie.has_prefix("f")
	# assert not trie.has_prefix("z")
	# ~~~
	fun has_prefix(prefix: String): Bool do
		if prefix == "" then return true
		return search_node(prefix) != null
	end

	# Search a node by a key or prefix
	#
	# Returns `null` if no node matches `string`.
	private fun search_node(string: nullable Object): nullable TrieNode[E] do
		if string == null then return null
		string = string.to_s
		var children = root.children
		var node = null
		for i in [0..string.length[ do
			var c = string.chars[i]
			if children.has_key(c) then
				node = children[c]
				children = node.children
			else
				node = null
				break
			end
		end
		return node
	end
end
lib/trees/trie.nit:45,1--181,3