nlp :: NLPFileIndex
nlp :: NLPFileIndex :: defaultinit
nlp $ NLPFileIndex :: SELF
Type of this instance, automatically specialized in every class
vsm :: FileIndex :: accept_file
Is `path` accepted depending on `whitelist_exts` and `blacklist_exts`?
nlp :: NLPIndex :: accept_token
Is `token` accepted by this index?
vsm :: FileIndex :: blacklist_exts=
File extensions black list
nlp :: NLPIndex :: blacklist_pos=
Part-Of-Speech blacklist
core :: Object :: class_factory
Implementation used by `get_class` to create the specific class.
nlp :: NLPIndex :: defaultinit
vsm :: StringIndex :: defaultinit
nlp :: NLPFileIndex :: defaultinit
vsm :: FileIndex :: defaultinit
core :: Object :: defaultinit
vsm :: VSMIndex :: defaultinit
vsm :: VSMIndex :: index_document
Index a document
vsm :: FileIndex :: index_file
Index a file from its `path`.
vsm :: FileIndex :: index_files
Index multiple files
vsm :: StringIndex :: index_string
Index a new Document from `title`, `uri` and string `string`.
vsm :: VSMIndex :: inverse_doc_frequency
Inverse document frequency
vsm :: VSMIndex :: inverse_doc_frequency=
Inverse document frequency
vsm :: VSMIndex :: inversed_index
Inversed index
vsm :: VSMIndex :: inversed_index=
Inversed index
core :: Object :: is_same_instance
Return true if `self` and `other` are the same instance (i.e. same identity).
core :: Object :: is_same_serialized
Is `self` the same as `other` in a serialization context?
core :: Object :: is_same_type
Return true if `self` and `other` have the same dynamic type.
vsm :: StringIndex :: match_string
Match the `query` string against all indexed documents
vsm :: VSMIndex :: match_vector
Match the `query` vector against all indexed document vectors
nlp :: NLPIndex :: nlp_processor
NLP Processor used to tokenize, lemmatize and POS tag documents
nlp :: NLPIndex :: nlp_processor=
NLP Processor used to tokenize, lemmatize and POS tag documents
core :: Object :: output_class_name
Display class name on stdout (debug only).
vsm :: FileIndex :: parse_file
Parse the `file` content as a Vector
vsm :: StringIndex :: parse_string
Parse the `string` as a Vector
vsm :: VSMIndex :: terms_doc_count
Count for all terms in all indexed documents
vsm :: VSMIndex :: terms_doc_count=
Count for all terms in all indexed documents
vsm :: FileIndex :: whitelist_exts=
File extensions white list
nlp :: NLPIndex :: whitelist_pos=
Part-Of-Speech whitelist
# A `FileIndex` that relies on an `NLPProcessor`.
#
# Combines `NLPIndex` and `FileIndex` through multiple inheritance and
# declares no members of its own.
class NLPFileIndex
super NLPIndex
super FileIndex
end
lib/nlp/nlp.nit:73,1--77,3