Index
A
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
J
|
K
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
T
|
U
|
V
|
W
|
Y
A
acronyms_and_definitions() (in module textacy.extract)
add() (textacy.corpus.Corpus method)
add_doc() (textacy.corpus.Corpus method)
add_docs() (textacy.corpus.Corpus method)
add_record() (textacy.corpus.Corpus method)
add_records() (textacy.corpus.Corpus method)
add_text() (textacy.corpus.Corpus method)
add_texts() (textacy.corpus.Corpus method)
aggregate_term_variants() (in module textacy.ke.utils)
antonyms() (textacy.resources.concept_net.ConceptNet property)
apply_idf_weighting() (in module textacy.vsm.matrix_utils)
apply_transforms() (textacy.augmentation.augmenter.Augmenter method)
Augmenter (class in textacy.augmentation.augmenter)
AugTok (class in textacy.augmentation.utils)
authors (textacy.datasets.oxford_text_archive.OxfordTextArchive attribute)
automated_readability_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
automatic_arabic_readability_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
C
Candidate (class in textacy.ke.sgrank)
CapitolWords (class in textacy.datasets.capitol_words)
chambers (textacy.datasets.capitol_words.CapitolWords attribute)
character_ngrams() (in module textacy.similarity)
clean_terms() (in module textacy.text_utils)
clear() (in module textacy.cache)
coerce_content_type() (in module textacy.io.utils)
coleman_liau_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
ConceptNet (class in textacy.resources.concept_net)
congresses (textacy.datasets.capitol_words.CapitolWords attribute)
Corpus (class in textacy.corpus)
count (textacy.ke.sgrank.Candidate attribute)
D
decision_directions (textacy.datasets.supreme_court.SupremeCourt attribute)
default() (textacy.io.json.ExtendedJSONEncoder method)
delete_chars() (in module textacy.augmentation.transforms)
delete_words() (in module textacy.augmentation.transforms)
DepecheMood (class in textacy.resources.depeche_mood)
deprecated() (in module textacy.utils)
direct_quotations() (in module textacy.extract)
docs (textacy.corpus.Corpus attribute)
download() (textacy.datasets.capitol_words.CapitolWords method)
(textacy.datasets.imdb.IMDB method)
(textacy.datasets.oxford_text_archive.OxfordTextArchive method)
(textacy.datasets.reddit_comments.RedditComments method)
(textacy.datasets.supreme_court.SupremeCourt method)
(textacy.datasets.udhr.UDHR method)
(textacy.datasets.wikimedia.Wikimedia method)
(textacy.lang_utils.LangIdentifier method)
(textacy.resources.concept_net.ConceptNet method)
(textacy.resources.depeche_mood.DepecheMood method)
download_file() (in module textacy.io.utils)
draw_semantic_network() (in module textacy.viz.network)
draw_termite_plot() (in module textacy.viz.termite)
E
entities() (in module textacy.extract)
entropy() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
ExtendedJSONEncoder (class in textacy.io.json)
F
filepath() (textacy.datasets.capitol_words.CapitolWords property)
(textacy.datasets.supreme_court.SupremeCourt property)
(textacy.datasets.wikimedia.Wikimedia property)
(textacy.resources.concept_net.ConceptNet property)
(textacy.resources.depeche_mood.DepecheMood property)
filepaths() (textacy.datasets.reddit_comments.RedditComments property)
filter_terms_by_df() (in module textacy.vsm.matrix_utils)
filter_terms_by_ic() (in module textacy.vsm.matrix_utils)
fit() (textacy.vsm.vectorizers.GroupVectorizer method)
(textacy.vsm.vectorizers.Vectorizer method)
fit_transform() (textacy.vsm.vectorizers.GroupVectorizer method)
(textacy.vsm.vectorizers.Vectorizer method)
flesch_kincaid_grade_level() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
flesch_reading_ease() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
full_date_range (textacy.datasets.capitol_words.CapitolWords attribute)
(textacy.datasets.oxford_text_archive.OxfordTextArchive attribute)
(textacy.datasets.reddit_comments.RedditComments attribute)
(textacy.datasets.supreme_court.SupremeCourt attribute)
full_rating_range (textacy.datasets.imdb.IMDB attribute)
G
get() (textacy.corpus.Corpus method)
get_antonyms() (textacy.resources.concept_net.ConceptNet method)
get_char_weights() (in module textacy.augmentation.utils)
get_config() (in module textacy.utils)
get_doc_extensions() (in module textacy.spacier.doc_extensions)
get_doc_freqs() (in module textacy.vsm.matrix_utils)
get_doc_lengths() (in module textacy.vsm.matrix_utils)
get_doc_topic_matrix() (textacy.tm.topic_model.TopicModel method)
get_emotional_valence() (textacy.resources.depeche_mood.DepecheMood method)
get_filename_from_url() (in module textacy.io.utils)
get_filepaths() (in module textacy.io.utils)
get_filtered_topn_terms() (in module textacy.ke.utils)
get_hyponyms() (textacy.resources.concept_net.ConceptNet method)
get_information_content() (in module textacy.vsm.matrix_utils)
get_inverse_doc_freqs() (in module textacy.vsm.matrix_utils)
get_kwargs_for_func() (in module textacy.utils)
get_lang() (in module textacy.spacier.doc_extensions)
get_longest_subsequence_candidates() (in module textacy.ke.utils)
get_main_verbs_of_sent() (in module textacy.spacier.utils)
get_meronyms() (textacy.resources.concept_net.ConceptNet method)
get_meta() (in module textacy.spacier.doc_extensions)
get_n_sents() (in module textacy.spacier.doc_extensions)
get_n_tokens() (in module textacy.spacier.doc_extensions)
get_ngram_candidates() (in module textacy.ke.utils)
get_normalized_text() (in module textacy.spacier.utils)
get_objects_of_verb() (in module textacy.spacier.utils)
get_pattern_matching_candidates() (in module textacy.ke.utils)
get_preview() (in module textacy.spacier.doc_extensions)
get_span_for_compound_noun() (in module textacy.spacier.utils)
get_span_for_verb_auxiliaries() (in module textacy.spacier.utils)
get_subjects_of_verb() (in module textacy.spacier.utils)
get_synonyms() (textacy.resources.concept_net.ConceptNet method)
get_term_freqs() (in module textacy.vsm.matrix_utils)
get_tokens() (in module textacy.spacier.doc_extensions)
GroupVectorizer (class in textacy.vsm.vectorizers)
grps_list() (textacy.vsm.vectorizers.GroupVectorizer property)
gulpease_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
gunning_fog_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
H
hyponyms() (textacy.resources.concept_net.ConceptNet property)
I
id_to_grp() (textacy.vsm.vectorizers.GroupVectorizer property)
id_to_term (textacy.vsm.vectorizers.GroupVectorizer attribute)
id_to_term() (textacy.vsm.vectorizers.Vectorizer property)
identify_lang() (in module textacy.lang_utils)
(textacy.lang_utils.LangIdentifier method)
identify_topn_langs() (textacy.lang_utils.LangIdentifier method)
idx (textacy.ke.sgrank.Candidate attribute)
IMDB (class in textacy.datasets.imdb)
init_pipeline() (textacy.lang_utils.LangIdentifier method)
insert_chars() (in module textacy.augmentation.transforms)
insert_word_synonyms() (in module textacy.augmentation.transforms)
is_acronym() (in module textacy.text_utils)
is_record() (in module textacy.utils)
is_word (textacy.augmentation.utils.AugTok attribute)
issue_area_codes (textacy.datasets.supreme_court.SupremeCourt attribute)
issue_codes (textacy.datasets.supreme_court.SupremeCourt attribute)
J
jaccard() (in module textacy.similarity)
K
keyword_in_context() (in module textacy.text_utils)
KWIC() (in module textacy.text_utils)
L
lang (textacy.corpus.Corpus attribute)
LangIdentifier (class in textacy.lang_utils)
langs (textacy.datasets.udhr.UDHR attribute)
length (textacy.ke.sgrank.Candidate attribute)
levenshtein() (in module textacy.similarity)
lix() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
load() (textacy.corpus.Corpus class method)
load_hyphenator() (in module textacy.text_stats.api)
load_spacy_lang() (in module textacy.spacier.core)
LRU_CACHE (in module textacy.cache)
M
make_doc_from_text_chunks() (in module textacy.spacier.utils)
make_spacy_doc() (in module textacy.spacier.core)
matches() (in module textacy.extract)
merge_spans() (in module textacy.spacier.utils)
meronyms() (textacy.resources.concept_net.ConceptNet property)
metadata() (textacy.datasets.oxford_text_archive.OxfordTextArchive property)
module
textacy.augmentation.augmenter
textacy.augmentation.transforms
textacy.augmentation.utils
textacy.cache
textacy.corpus
textacy.datasets.capitol_words
textacy.datasets.imdb
textacy.datasets.oxford_text_archive
textacy.datasets.reddit_comments
textacy.datasets.supreme_court
textacy.datasets.udhr
textacy.datasets.wikimedia
textacy.extract
textacy.io.csv
textacy.io.http
textacy.io.json
textacy.io.matrix
textacy.io.spacy
textacy.io.text
textacy.io.utils
textacy.ke.scake
textacy.ke.sgrank
textacy.ke.textrank
textacy.ke.utils
textacy.ke.yake
textacy.lang_utils
textacy.network
textacy.preprocessing.normalize
textacy.preprocessing.remove
textacy.preprocessing.replace
textacy.resources.concept_net
textacy.resources.depeche_mood
textacy.similarity
textacy.spacier.components
textacy.spacier.core
textacy.spacier.doc_extensions
textacy.spacier.utils
textacy.text_stats.api
textacy.text_stats.basics
textacy.text_stats.readability
textacy.text_utils
textacy.tm.topic_model
textacy.utils
textacy.viz.network
textacy.viz.termite
textacy.vsm.matrix_utils
textacy.vsm.vectorizers
most_discriminating_terms() (in module textacy.ke.utils)
mu_legibility_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
N
n_chars() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_chars_per_word() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_docs (textacy.corpus.Corpus attribute)
n_long_words() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_monosyllable_words() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_polysyllable_words() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_sents (textacy.corpus.Corpus attribute)
n_sents() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_syllables() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_syllables_per_word() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_tokens (textacy.corpus.Corpus attribute)
n_unique_words() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
n_words() (in module textacy.text_stats.basics)
(textacy.text_stats.api.TextStats property)
name (textacy.spacier.components.TextStatsComponent attribute)
ngrams() (in module textacy.extract)
normalize_hyphenated_words() (in module textacy.preprocessing.normalize)
normalize_quotation_marks() (in module textacy.preprocessing.normalize)
normalize_repeating_chars() (in module textacy.preprocessing.normalize)
normalize_terms() (in module textacy.ke.utils)
normalize_unicode() (in module textacy.preprocessing.normalize)
normalize_whitespace() (in module textacy.preprocessing.normalize)
noun_chunks() (in module textacy.extract)
O
open_sesame() (in module textacy.io.utils)
opinion_author_codes (textacy.datasets.supreme_court.SupremeCourt attribute)
OxfordTextArchive (class in textacy.datasets.oxford_text_archive)
P
perspicuity_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
pipeline (textacy.lang_utils.LangIdentifier attribute)
pos (textacy.augmentation.utils.AugTok attribute)
pos_regex_matches() (in module textacy.extract)
preserve_case() (in module textacy.spacier.utils)
print_markdown() (in module textacy.utils)
R
read_csv() (in module textacy.io.csv)
read_http_stream() (in module textacy.io.http)
read_json() (in module textacy.io.json)
read_json_mash() (in module textacy.io.json)
read_spacy_docs() (in module textacy.io.spacy)
read_sparse_matrix() (in module textacy.io.matrix)
read_text() (in module textacy.io.text)
records() (textacy.datasets.capitol_words.CapitolWords method)
(textacy.datasets.imdb.IMDB method)
(textacy.datasets.oxford_text_archive.OxfordTextArchive method)
(textacy.datasets.reddit_comments.RedditComments method)
(textacy.datasets.supreme_court.SupremeCourt method)
(textacy.datasets.udhr.UDHR method)
(textacy.datasets.wikimedia.Wikimedia method)
RedditComments (class in textacy.datasets.reddit_comments)
remove() (textacy.corpus.Corpus method)
remove_accents() (in module textacy.preprocessing.remove)
remove_doc_extensions() (in module textacy.spacier.doc_extensions)
remove_punctuation() (in module textacy.preprocessing.remove)
replace_currency_symbols() (in module textacy.preprocessing.replace)
replace_emails() (in module textacy.preprocessing.replace)
replace_emojis() (in module textacy.preprocessing.replace)
replace_hashtags() (in module textacy.preprocessing.replace)
replace_numbers() (in module textacy.preprocessing.replace)
replace_phone_numbers() (in module textacy.preprocessing.replace)
replace_urls() (in module textacy.preprocessing.replace)
replace_user_handles() (in module textacy.preprocessing.replace)
S
save() (textacy.corpus.Corpus method)
scake() (in module textacy.ke.scake)
semistructured_statements() (in module textacy.extract)
sents_to_semantic_network() (in module textacy.network)
set_doc_extensions() (in module textacy.spacier.doc_extensions)
set_meta() (in module textacy.spacier.doc_extensions)
sgrank() (in module textacy.ke.sgrank)
smog_index() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
spacy_lang (textacy.corpus.Corpus attribute)
speaker_names (textacy.datasets.capitol_words.CapitolWords attribute)
speaker_parties (textacy.datasets.capitol_words.CapitolWords attribute)
split_records() (in module textacy.io.utils)
subject_verb_object_triples() (in module textacy.extract)
substitute_chars() (in module textacy.augmentation.transforms)
substitute_word_synonyms() (in module textacy.augmentation.transforms)
SupremeCourt (class in textacy.datasets.supreme_court)
swap_chars() (in module textacy.augmentation.transforms)
swap_words() (in module textacy.augmentation.transforms)
synonyms() (textacy.resources.concept_net.ConceptNet property)
syns (textacy.augmentation.utils.AugTok attribute)
T
termite_df_plot() (in module textacy.viz.termite)
termite_plot() (textacy.tm.topic_model.TopicModel method)
terms_list (textacy.vsm.vectorizers.GroupVectorizer attribute)
terms_list() (textacy.vsm.vectorizers.Vectorizer property)
terms_to_semantic_network() (in module textacy.network)
text (textacy.augmentation.utils.AugTok attribute)
(textacy.ke.sgrank.Candidate attribute)
textacy.augmentation.augmenter
module
textacy.augmentation.transforms
module
textacy.augmentation.utils
module
textacy.cache
module
textacy.corpus
module
textacy.datasets.capitol_words
module
textacy.datasets.imdb
module
textacy.datasets.oxford_text_archive
module
textacy.datasets.reddit_comments
module
textacy.datasets.supreme_court
module
textacy.datasets.udhr
module
textacy.datasets.wikimedia
module
textacy.extract
module
textacy.io.csv
module
textacy.io.http
module
textacy.io.json
module
textacy.io.matrix
module
textacy.io.spacy
module
textacy.io.text
module
textacy.io.utils
module
textacy.ke.scake
module
textacy.ke.sgrank
module
textacy.ke.textrank
module
textacy.ke.utils
module
textacy.ke.yake
module
textacy.lang_utils
module
textacy.network
module
textacy.preprocessing.normalize
module
textacy.preprocessing.remove
module
textacy.preprocessing.replace
module
textacy.resources.concept_net
module
textacy.resources.depeche_mood
module
textacy.similarity
module
textacy.spacier.components
module
textacy.spacier.core
module
textacy.spacier.doc_extensions
module
textacy.spacier.utils
module
textacy.text_stats.api
module
textacy.text_stats.basics
module
textacy.text_stats.readability
module
textacy.text_utils
module
textacy.tm.topic_model
module
textacy.utils
module
textacy.viz.network
module
textacy.viz.termite
module
textacy.vsm.matrix_utils
module
textacy.vsm.vectorizers
module
textrank() (in module textacy.ke.textrank)
texts() (textacy.datasets.capitol_words.CapitolWords method)
(textacy.datasets.imdb.IMDB method)
(textacy.datasets.oxford_text_archive.OxfordTextArchive method)
(textacy.datasets.reddit_comments.RedditComments method)
(textacy.datasets.supreme_court.SupremeCourt method)
(textacy.datasets.udhr.UDHR method)
(textacy.datasets.wikimedia.Wikimedia method)
TextStats (class in textacy.text_stats.api)
TextStatsComponent (class in textacy.spacier.components)
to_aug_toks() (in module textacy.augmentation.utils)
to_bag_of_terms() (in module textacy.spacier.doc_extensions)
to_bag_of_words() (in module textacy.spacier.doc_extensions)
to_bytes() (in module textacy.utils)
to_collection() (in module textacy.utils)
to_path() (in module textacy.utils)
to_semantic_network() (in module textacy.spacier.doc_extensions)
to_tagged_text() (in module textacy.spacier.doc_extensions)
to_terms_list() (in module textacy.spacier.doc_extensions)
to_tokenized_text() (in module textacy.spacier.doc_extensions)
to_unicode() (in module textacy.utils)
token_sort_ratio() (in module textacy.similarity)
top_doc_topics() (textacy.tm.topic_model.TopicModel method)
top_topic_docs() (textacy.tm.topic_model.TopicModel method)
top_topic_terms() (textacy.tm.topic_model.TopicModel method)
topic_weights() (textacy.tm.topic_model.TopicModel method)
TopicModel (class in textacy.tm.topic_model)
transform() (textacy.vsm.vectorizers.GroupVectorizer method)
(textacy.vsm.vectorizers.Vectorizer method)
U
UDHR (class in textacy.datasets.udhr)
unpack_archive() (in module textacy.io.utils)
unzip() (in module textacy.io.utils)
V
validate_and_clip_range() (in module textacy.utils)
validate_set_members() (in module textacy.utils)
vector_norms() (textacy.corpus.Corpus property)
Vectorizer (class in textacy.vsm.vectorizers)
vectors() (textacy.corpus.Corpus property)
vocabulary_grps (textacy.vsm.vectorizers.GroupVectorizer attribute)
vocabulary_terms (textacy.vsm.vectorizers.GroupVectorizer attribute)
(textacy.vsm.vectorizers.Vectorizer attribute)
W
weighting() (textacy.vsm.vectorizers.Vectorizer property)
weights() (textacy.resources.depeche_mood.DepecheMood property)
wiener_sachtextformel() (in module textacy.text_stats.readability)
(textacy.text_stats.api.TextStats property)
Wikimedia (class in textacy.datasets.wikimedia)
Wikinews (class in textacy.datasets.wikimedia)
Wikipedia (class in textacy.datasets.wikimedia)
word2vec() (in module textacy.similarity)
word_counts() (textacy.corpus.Corpus method)
word_doc_counts() (textacy.corpus.Corpus method)
word_movers() (in module textacy.similarity)
words() (in module textacy.extract)
write_csv() (in module textacy.io.csv)
write_http_stream() (in module textacy.io.http)
write_json() (in module textacy.io.json)
write_spacy_docs() (in module textacy.io.spacy)
write_sparse_matrix() (in module textacy.io.matrix)
write_text() (in module textacy.io.text)
ws (textacy.augmentation.utils.AugTok attribute)
Y
yake() (in module textacy.ke.yake)
Navigation
Installation
Quickstart
API Reference
Changes
Related Topics
Documentation overview
Quick search