Text Data
0.1.0
Max Lee Documentation Site
Installation
How text_data is organized
Getting Started
Corpus Structure
Exploring Text Data
text_data
Page
Index
A
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
L
|
M
|
N
|
O
|
P
|
Q
|
R
|
S
|
T
|
U
|
V
|
W
A
add_documents() (text_data.Corpus method)
(text_data.index.Corpus method)
(text_data.index.WordIndex method)
(text_data.WordIndex method)
add_ngram_index() (text_data.Corpus method)
(text_data.index.Corpus method)
C
chunks() (text_data.Corpus class method)
(text_data.index.Corpus class method)
concatenate() (in module text_data.multi_corpus)
(text_data.Corpus method)
(text_data.index.Corpus method)
(text_data.index.WordIndex method)
(text_data.WordIndex method)
copy() (text_data.Corpus method)
(text_data.index.Corpus method)
(text_data.index.WordIndex method)
(text_data.WordIndex method)
Corpus (class in text_data)
(class in text_data.index)
corpus_tokenizer() (in module text_data.tokenize)
count_matrix() (text_data.index.WordIndex method)
(text_data.WordIndex method)
D
default_tokenizer() (in module text_data.tokenize)
display_document() (text_data.Corpus method)
(text_data.index.Corpus method)
display_document_count() (text_data.Corpus method)
(text_data.index.Corpus method)
display_document_frequency() (text_data.Corpus method)
(text_data.index.Corpus method)
display_documents() (text_data.Corpus method)
(text_data.index.Corpus method)
display_occurrence_count() (text_data.Corpus method)
(text_data.index.Corpus method)
display_score_table() (in module text_data.display)
display_score_tables() (in module text_data.display)
display_search_results() (text_data.Corpus method)
(text_data.index.Corpus method)
doc_contains() (text_data.index.WordIndex method)
(text_data.WordIndex method)
doc_count_vector() (text_data.index.WordIndex method)
(text_data.WordIndex method)
doc_freq_vector() (text_data.index.WordIndex method)
(text_data.WordIndex method)
doc_id (text_data.index.PositionResult attribute)
doc_lengths() (text_data.index.WordIndex property)
(text_data.WordIndex property)
docs_with_word() (text_data.index.WordIndex method)
(text_data.WordIndex method)
document_count() (text_data.index.WordIndex method)
(text_data.WordIndex method)
document_frequency() (text_data.index.WordIndex method)
(text_data.WordIndex method)
documents (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
E
exact (text_data.query.QueryItem attribute)
F
first_idx (text_data.index.PositionResult attribute)
flat_concat() (in module text_data.multi_corpus)
flatten() (text_data.Corpus method)
(text_data.index.Corpus method)
(text_data.index.WordIndex method)
(text_data.WordIndex method)
frequency_map() (in module text_data.display)
frequency_matrix() (text_data.index.WordIndex method)
(text_data.WordIndex method)
G
get_top_words() (text_data.index.WordIndex method)
(text_data.WordIndex method)
H
heatmap() (in module text_data.display)
histogram() (in module text_data.display)
I
idf() (text_data.index.WordIndex method)
(text_data.WordIndex method)
idf_vector() (text_data.index.WordIndex method)
(text_data.WordIndex method)
L
last_idx (text_data.index.PositionResult attribute)
M
max_word_count() (text_data.index.WordIndex method)
(text_data.WordIndex method)
modifier (text_data.query.QueryItem attribute)
module
text_data
text_data.core
text_data.display
text_data.index
text_data.multi_corpus
text_data.query
text_data.tokenize
most_common() (text_data.index.WordIndex method)
(text_data.WordIndex method)
N
ngram_indexes (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
ngram_prefix (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
ngram_sep (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
ngram_suffix (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
num_words() (text_data.index.WordIndex property)
(text_data.WordIndex property)
O
odds_document() (text_data.index.WordIndex method)
(text_data.WordIndex method)
odds_matrix() (text_data.index.WordIndex method)
(text_data.WordIndex method)
odds_vector() (text_data.index.WordIndex method)
(text_data.WordIndex method)
odds_word() (text_data.index.WordIndex method)
(text_data.WordIndex method)
one_hot_matrix() (text_data.index.WordIndex method)
(text_data.WordIndex method)
P
PositionResult (class in text_data.index)
postprocess_positions() (in module text_data.tokenize)
Q
Query (class in text_data.query)
QueryItem (class in text_data.query)
R
ranked_search() (text_data.Corpus method)
(text_data.index.Corpus method)
raw_end (text_data.index.PositionResult attribute)
raw_start (text_data.index.PositionResult attribute)
render_bar_chart() (in module text_data.display)
render_multi_bar_chart() (in module text_data.display)
requires_display_extra() (in module text_data.core)
reset_index() (text_data.index.WordIndex method)
(text_data.WordIndex method)
S
search_document_count() (text_data.Corpus method)
(text_data.index.Corpus method)
search_document_freq() (text_data.Corpus method)
(text_data.index.Corpus method)
search_documents() (text_data.Corpus method)
(text_data.index.Corpus method)
search_occurrence_count() (text_data.Corpus method)
(text_data.index.Corpus method)
search_occurrences() (text_data.Corpus method)
(text_data.index.Corpus method)
skip_words() (text_data.index.WordIndex method)
(text_data.WordIndex method)
slice() (text_data.Corpus method)
(text_data.index.Corpus method)
(text_data.index.WordIndex method)
(text_data.WordIndex method)
slice_many() (text_data.index.WordIndex method)
(text_data.WordIndex method)
split_off() (text_data.Corpus method)
(text_data.index.Corpus method)
(text_data.index.WordIndex method)
(text_data.WordIndex method)
T
term_count() (text_data.index.WordIndex method)
(text_data.WordIndex method)
term_frequency() (text_data.index.WordIndex method)
(text_data.WordIndex method)
text_data
module
text_data.core
module
text_data.display
module
text_data.index
module
text_data.multi_corpus
module
text_data.query
module
text_data.tokenize
module
tfidf_matrix() (text_data.index.WordIndex method)
(text_data.WordIndex method)
to_index() (text_data.Corpus method)
(text_data.index.Corpus method)
tokenize_regex_positions() (in module text_data.tokenize)
tokenized_documents (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
tokenizer (text_data.Corpus attribute)
(text_data.index.Corpus attribute)
U
update() (text_data.Corpus method)
(text_data.index.Corpus method)
V
vocab() (text_data.index.WordIndex property)
(text_data.WordIndex property)
vocab_list() (text_data.index.WordIndex property)
(text_data.WordIndex property)
vocab_size() (text_data.index.WordIndex property)
(text_data.WordIndex property)
W
word_count() (text_data.index.WordIndex method)
(text_data.WordIndex method)
word_count_vector() (text_data.index.WordIndex method)
(text_data.WordIndex method)
word_counter() (text_data.index.WordIndex method)
(text_data.WordIndex method)
word_freq_vector() (text_data.index.WordIndex method)
(text_data.WordIndex method)
word_frequency() (text_data.index.WordIndex method)
(text_data.WordIndex method)
WordIndex (class in text_data)
(class in text_data.index)
words (text_data.query.QueryItem attribute)