Table of Contents
Autogenerated API
simserver
simserver.NullHandler
simserver.SessionServer
simserver.SimServer
word2vec
word2vec.doc2vec()
word2vec.load()
word2vec.load_clusters()
word2vec.run_cmd()
word2vec.unitvec()
word2vec.word2clusters()
word2vec.word2phrase()
word2vec.word2vec()
word2vec.WordClusters
word2vec.WordVectors
stop_words
stop_words.add_filter()
stop_words.apply_filters()
stop_words.get_stop_words()
stop_words.get_version()
stop_words.remove_filter()
stop_words.safe_get_stop_words()
nltk
nltk.accuracy()
nltk.add_logs()
nltk.alignment_error_rate()
nltk.apply_features()
nltk.approxrand()
nltk.arity()
nltk.bigrams()
nltk.binary_distance()
nltk.binary_search_file()
nltk.binding_ops()
nltk.bleu()
nltk.boolean_ops()
nltk.bracket_parse()
nltk.breadth_first()
nltk.build_opener()
nltk.call_megam()
nltk.casual_tokenize()
nltk.choose()
nltk.clause()
nltk.clean_html()
nltk.clean_url()
nltk.config_java()
nltk.config_megam()
nltk.config_weka()
nltk.conflicts()
nltk.conllstr2tree()
nltk.conlltags2tree()
nltk.custom_distance()
nltk.decorator()
nltk.demo()
nltk.download_gui()
nltk.download_shell()
nltk.edit_distance()
nltk.elementtree_indent()
nltk.entropy()
nltk.equality_preds()
nltk.evaluate_sents()
nltk.everygrams()
nltk.extract_rels()
nltk.extract_test_sentences()
nltk.f_measure()
nltk.filestring()
nltk.flatten()
nltk.fractional_presence()
nltk.getproxies()
nltk.ghd()
nltk.guess_encoding()
nltk.ieerstr2tree()
nltk.in_idle()
nltk.induce_pcfg()
nltk.install_opener()
nltk.interpret_sents()
nltk.interval_distance()
nltk.invert_dict()
nltk.invert_graph()
nltk.is_rel()
nltk.jaccard_distance()
nltk.line_tokenize()
nltk.load()
nltk.load_parser()
nltk.log_likelihood()
nltk.map_tag()
nltk.masi_distance()
nltk.memoize()
nltk.ne_chunk()
nltk.ne_chunk_sents()
nltk.ngrams()
nltk.nonterminals()
nltk.pad_sequence()
nltk.parse_sents()
nltk.pk()
nltk.pos_tag()
nltk.pos_tag_sents()
nltk.pprint()
nltk.pr()
nltk.precision()
nltk.presence()
nltk.print_string()
nltk.py25()
nltk.py26()
nltk.py27()
nltk.python_2_unicode_compatible()
nltk.raise_unorderable_types()
nltk.ranks_from_scores()
nltk.ranks_from_sequence()
nltk.re_show()
nltk.read_grammar()
nltk.read_logic()
nltk.read_valuation()
nltk.recall()
nltk.regexp_span_tokenize()
nltk.regexp_tokenize()
nltk.register_tag()
nltk.ribes()
nltk.root_semrep()
nltk.rte_classifier()
nltk.rte_features()
nltk.rtuple()
nltk.sent_tokenize()
nltk.set2rel()
nltk.set_proxy()
nltk.sinica_parse()
nltk.skipgrams()
nltk.skolemize()
nltk.slice_bounds()
nltk.spearman_correlation()
nltk.str2tuple()
nltk.string_span_tokenize()
nltk.subsumes()
nltk.sum_logs()
nltk.tagset_mapping()
nltk.tagstr2tree()
nltk.tokenwrap()
nltk.total_ordering()
nltk.transitive_closure()
nltk.tree2conllstr()
nltk.tree2conlltags()
nltk.trigrams()
nltk.tuple2str()
nltk.unify()
nltk.unique_list()
nltk.untag()
nltk.usage()
nltk.windowdiff()
nltk.word_tokenize()
nltk.AbstractLazySequence
nltk.AffixTagger
nltk.AlignedSent
nltk.Alignment
nltk.AnnotationTask
nltk.ApplicationExpression
nltk.Assignment
nltk.BigramAssocMeasures
nltk.BigramCollocationFinder
nltk.BigramTagger
nltk.BinaryMaxentFeatureEncoding
nltk.BlanklineTokenizer
nltk.BllipParser
nltk.BottomUpChartParser
nltk.BottomUpLeftCornerChartParser
nltk.BottomUpProbabilisticChartParser
nltk.Boxer
nltk.BrillTagger
nltk.BrillTaggerTrainer
nltk.CFG
nltk.CRFTagger
nltk.CfgReadingCommand
nltk.ChartParser
nltk.ChunkParserI
nltk.ChunkScore
nltk.ClassifierBasedPOSTagger
nltk.ClassifierBasedTagger
nltk.ClassifierI
nltk.ConcordanceIndex
nltk.ConditionalExponentialClassifier
nltk.ConditionalFreqDist
nltk.ConditionalProbDist
nltk.ConditionalProbDistI
nltk.ConfusionMatrix
nltk.ContextIndex
nltk.ContextTagger
nltk.ContingencyMeasures
nltk.CrossValidationProbDist
nltk.DRS
nltk.DecisionTreeClassifier
nltk.DefaultTagger
nltk.DependencyEvaluator
nltk.DependencyGrammar
nltk.DependencyGraph
nltk.DependencyProduction
nltk.DictionaryConditionalProbDist
nltk.DictionaryProbDist
nltk.DiscourseTester
nltk.DrtExpression
nltk.DrtGlueReadingCommand
nltk.ELEProbDist
nltk.EarleyChartParser
nltk.Expression
nltk.FStructure
nltk.FeatDict
nltk.FeatList
nltk.FeatStruct
nltk.FeatStructReader
nltk.Feature
nltk.FeatureBottomUpChartParser
nltk.FeatureBottomUpLeftCornerChartParser
nltk.FeatureChartParser
nltk.FeatureEarleyChartParser
nltk.FeatureIncrementalBottomUpChartParser
nltk.FeatureIncrementalBottomUpLeftCornerChartParser
nltk.FeatureIncrementalChartParser
nltk.FeatureIncrementalTopDownChartParser
nltk.FeatureTopDownChartParser
nltk.FreqDist
nltk.HTTPPasswordMgrWithDefaultRealm
nltk.HeldoutProbDist
nltk.HiddenMarkovModelTagger
nltk.HiddenMarkovModelTrainer
nltk.HunposTagger
nltk.IBMModel
nltk.IBMModel1
nltk.IBMModel2
nltk.IBMModel3
nltk.IBMModel4
nltk.IBMModel5
nltk.ISRIStemmer
nltk.ImmutableMultiParentedTree
nltk.ImmutableParentedTree
nltk.ImmutableProbabilisticMixIn
nltk.ImmutableProbabilisticTree
nltk.ImmutableTree
nltk.IncrementalBottomUpChartParser
nltk.IncrementalBottomUpLeftCornerChartParser
nltk.IncrementalChartParser
nltk.IncrementalLeftCornerChartParser
nltk.IncrementalTopDownChartParser
nltk.Index
nltk.InsideChartParser
nltk.JSONTaggedDecoder
nltk.JSONTaggedEncoder
nltk.KneserNeyProbDist
nltk.LancasterStemmer
nltk.LaplaceProbDist
nltk.LazyConcatenation
nltk.LazyEnumerate
nltk.LazyMap
nltk.LazySubsequence
nltk.LazyZip
nltk.LeftCornerChartParser
nltk.LidstoneProbDist
nltk.LineTokenizer
nltk.LongestChartParser
nltk.MLEProbDist
nltk.MWETokenizer
nltk.Mace
nltk.MaceCommand
nltk.MaltParser
nltk.MaxentClassifier
nltk.Model
nltk.MultiClassifierI
nltk.MultiParentedTree
nltk.MutableProbDist
nltk.NaiveBayesClassifier
nltk.NaiveBayesDependencyScorer
nltk.NgramAssocMeasures
nltk.NgramTagger
nltk.NonprojectiveDependencyParser
nltk.Nonterminal
nltk.OrderedDict
nltk.PCFG
nltk.Paice
nltk.ParallelProverBuilder
nltk.ParallelProverBuilderCommand
nltk.ParentedTree
nltk.ParserI
nltk.PerceptronTagger
nltk.PhraseTable
nltk.PorterStemmer
nltk.PositiveNaiveBayesClassifier
nltk.ProbDistI
nltk.ProbabilisticDependencyGrammar
nltk.ProbabilisticMixIn
nltk.ProbabilisticNonprojectiveParser
nltk.ProbabilisticProduction
nltk.ProbabilisticProjectiveDependencyParser
nltk.ProbabilisticTree
nltk.Production
nltk.ProjectiveDependencyParser
nltk.Prover9
nltk.Prover9Command
nltk.ProxyBasicAuthHandler
nltk.ProxyDigestAuthHandler
nltk.ProxyHandler
nltk.PunktSentenceTokenizer
nltk.QuadgramCollocationFinder
nltk.RSLPStemmer
nltk.RTEFeatureExtractor
nltk.RandomChartParser
nltk.RangeFeature
nltk.ReadingCommand
nltk.RecursiveDescentParser
nltk.RegexpChunkParser
nltk.RegexpParser
nltk.RegexpStemmer
nltk.RegexpTagger
nltk.RegexpTokenizer
nltk.ResolutionProver
nltk.ResolutionProverCommand
nltk.SExprTokenizer
nltk.Senna
nltk.SennaChunkTagger
nltk.SennaNERTagger
nltk.SennaTagger
nltk.SequentialBackoffTagger
nltk.ShiftReduceParser
nltk.SimpleGoodTuringProbDist
nltk.SklearnClassifier
nltk.SlashFeature
nltk.SnowballStemmer
nltk.SpaceTokenizer
nltk.StackDecoder
nltk.StanfordNERTagger
nltk.StanfordPOSTagger
nltk.StanfordTagger
nltk.StanfordTokenizer
nltk.StemmerI
nltk.SteppingChartParser
nltk.SteppingRecursiveDescentParser
nltk.SteppingShiftReduceParser
nltk.TabTokenizer
nltk.TableauProver
nltk.TableauProverCommand
nltk.TaggerI
nltk.TestGrammar
nltk.Text
nltk.TextCat
nltk.TextCollection
nltk.TextTilingTokenizer
nltk.TnT
nltk.TokenSearcher
nltk.TopDownChartParser
nltk.TransitionParser
nltk.Tree
nltk.TreebankWordTokenizer
nltk.Trie
nltk.TrigramAssocMeasures
nltk.TrigramCollocationFinder
nltk.TrigramTagger
nltk.TweetTokenizer
nltk.TypedMaxentFeatureEncoding
nltk.UniformProbDist
nltk.UnigramTagger
nltk.UnsortedChartParser
nltk.Valuation
nltk.Variable
nltk.ViterbiParser
nltk.WekaClassifier
nltk.WhitespaceTokenizer
nltk.WittenBellProbDist
nltk.WordNetLemmatizer
nltk.WordPunctTokenizer
nltk.chain
nltk.combinations
nltk.defaultdict
nltk.deque
nltk.islice
nltk.text_type
nltk.classify
nltk.classify.accuracy()
nltk.classify.apply_features()
nltk.classify.call_megam()
nltk.classify.config_megam()
nltk.classify.config_weka()
nltk.classify.log_likelihood()
nltk.classify.rte_classifier()
nltk.classify.rte_features()
nltk.classify.BinaryMaxentFeatureEncoding
nltk.classify.ClassifierI
nltk.classify.ConditionalExponentialClassifier
nltk.classify.DecisionTreeClassifier
nltk.classify.MaxentClassifier
nltk.classify.MultiClassifierI
nltk.classify.NaiveBayesClassifier
nltk.classify.PositiveNaiveBayesClassifier
nltk.classify.RTEFeatureExtractor
nltk.classify.Senna
nltk.classify.SklearnClassifier
nltk.classify.TextCat
nltk.classify.TypedMaxentFeatureEncoding
nltk.classify.WekaClassifier
nltk.cluster
nltk.cluster.cosine_distance()
nltk.cluster.euclidean_distance()
nltk.cluster.Dendrogram
nltk.cluster.EMClusterer
nltk.cluster.GAAClusterer
nltk.cluster.KMeansClusterer
nltk.cluster.VectorSpaceClusterer
nltk.chunk
nltk.chunk.accuracy()
nltk.chunk.conllstr2tree()
nltk.chunk.conlltags2tree()
nltk.chunk.ieerstr2tree()
nltk.chunk.load()
nltk.chunk.ne_chunk()
nltk.chunk.ne_chunk_sents()
nltk.chunk.tagstr2tree()
nltk.chunk.tree2conllstr()
nltk.chunk.tree2conlltags()
nltk.chunk.ChunkParserI
nltk.chunk.ChunkScore
nltk.chunk.RegexpChunkParser
nltk.chunk.RegexpParser
nltk.corpus
nltk.parse
nltk.parse.extract_test_sentences()
nltk.parse.load_parser()
nltk.parse.BllipParser
nltk.parse.BottomUpChartParser
nltk.parse.BottomUpLeftCornerChartParser
nltk.parse.BottomUpProbabilisticChartParser
nltk.parse.ChartParser
nltk.parse.DependencyEvaluator
nltk.parse.DependencyGraph
nltk.parse.EarleyChartParser
nltk.parse.FeatureBottomUpChartParser
nltk.parse.FeatureBottomUpLeftCornerChartParser
nltk.parse.FeatureChartParser
nltk.parse.FeatureEarleyChartParser
nltk.parse.FeatureIncrementalBottomUpChartParser
nltk.parse.FeatureIncrementalBottomUpLeftCornerChartParser
nltk.parse.FeatureIncrementalChartParser
nltk.parse.FeatureIncrementalTopDownChartParser
nltk.parse.FeatureTopDownChartParser
nltk.parse.IncrementalBottomUpChartParser
nltk.parse.IncrementalBottomUpLeftCornerChartParser
nltk.parse.IncrementalChartParser
nltk.parse.IncrementalLeftCornerChartParser
nltk.parse.IncrementalTopDownChartParser
nltk.parse.InsideChartParser
nltk.parse.LeftCornerChartParser
nltk.parse.LongestChartParser
nltk.parse.MaltParser
nltk.parse.NaiveBayesDependencyScorer
nltk.parse.NonprojectiveDependencyParser
nltk.parse.ParserI
nltk.parse.ProbabilisticNonprojectiveParser
nltk.parse.ProbabilisticProjectiveDependencyParser
nltk.parse.ProjectiveDependencyParser
nltk.parse.RandomChartParser
nltk.parse.RecursiveDescentParser
nltk.parse.ShiftReduceParser
nltk.parse.SteppingChartParser
nltk.parse.SteppingRecursiveDescentParser
nltk.parse.SteppingShiftReduceParser
nltk.parse.TestGrammar
nltk.parse.TopDownChartParser
nltk.parse.TransitionParser
nltk.parse.UnsortedChartParser
nltk.parse.ViterbiParser
nltk.sem
nltk.sem.arity()
nltk.sem.binding_ops()
nltk.sem.boolean_ops()
nltk.sem.clause()
nltk.sem.equality_preds()
nltk.sem.evaluate_sents()
nltk.sem.extract_rels()
nltk.sem.interpret_sents()
nltk.sem.is_rel()
nltk.sem.parse_sents()
nltk.sem.read_logic()
nltk.sem.read_valuation()
nltk.sem.root_semrep()
nltk.sem.rtuple()
nltk.sem.set2rel()
nltk.sem.skolemize()
nltk.sem.ApplicationExpression
nltk.sem.Assignment
nltk.sem.Boxer
nltk.sem.DRS
nltk.sem.DrtExpression
nltk.sem.Expression
nltk.sem.FStructure
nltk.sem.Model
nltk.sem.Valuation
nltk.sem.Variable
nltk.stem
nltk.stem.ISRIStemmer
nltk.stem.LancasterStemmer
nltk.stem.PorterStemmer
nltk.stem.RSLPStemmer
nltk.stem.RegexpStemmer
nltk.stem.SnowballStemmer
nltk.stem.StemmerI
nltk.stem.WordNetLemmatizer
nltk.tag
nltk.tag.load()
nltk.tag.map_tag()
nltk.tag.pos_tag()
nltk.tag.pos_tag_sents()
nltk.tag.str2tuple()
nltk.tag.tagset_mapping()
nltk.tag.tuple2str()
nltk.tag.untag()
nltk.tag.AffixTagger
nltk.tag.BigramTagger
nltk.tag.BrillTagger
nltk.tag.BrillTaggerTrainer
nltk.tag.CRFTagger
nltk.tag.ClassifierBasedPOSTagger
nltk.tag.ClassifierBasedTagger
nltk.tag.ContextTagger
nltk.tag.DefaultTagger
nltk.tag.HiddenMarkovModelTagger
nltk.tag.HiddenMarkovModelTrainer
nltk.tag.HunposTagger
nltk.tag.NgramTagger
nltk.tag.PerceptronTagger
nltk.tag.RegexpTagger
nltk.tag.SennaChunkTagger
nltk.tag.SennaNERTagger
nltk.tag.SennaTagger
nltk.tag.SequentialBackoffTagger
nltk.tag.StanfordNERTagger
nltk.tag.StanfordPOSTagger
nltk.tag.StanfordTagger
nltk.tag.TaggerI
nltk.tag.TnT
nltk.tag.TrigramTagger
nltk.tag.UnigramTagger
nltk.tokenize
nltk.tokenize.casual_tokenize()
nltk.tokenize.line_tokenize()
nltk.tokenize.load()
nltk.tokenize.regexp_span_tokenize()
nltk.tokenize.regexp_tokenize()
nltk.tokenize.sent_tokenize()
nltk.tokenize.string_span_tokenize()
nltk.tokenize.word_tokenize()
nltk.tokenize.BlanklineTokenizer
nltk.tokenize.LineTokenizer
nltk.tokenize.MWETokenizer
nltk.tokenize.PunktSentenceTokenizer
nltk.tokenize.RegexpTokenizer
nltk.tokenize.SExprTokenizer
nltk.tokenize.SpaceTokenizer
nltk.tokenize.StanfordTokenizer
nltk.tokenize.TabTokenizer
nltk.tokenize.TextTilingTokenizer
nltk.tokenize.TreebankWordTokenizer
nltk.tokenize.TweetTokenizer
nltk.tokenize.WhitespaceTokenizer
nltk.tokenize.WordPunctTokenizer
nltk.twitter
nltk.twitter.json2csv()
gensim
gensim.NullHandler
gensim.interfaces
gensim.interfaces.CorpusABC
gensim.interfaces.SimilarityABC
gensim.interfaces.TransformationABC
gensim.interfaces.TransformedCorpus
gensim.interfaces.xrange
gensim.matutils
gensim.matutils.any2sparse()
gensim.matutils.argsort()
gensim.matutils.blas()
gensim.matutils.corpus2csc()
gensim.matutils.corpus2dense()
gensim.matutils.cossim()
gensim.matutils.dense2vec()
gensim.matutils.entropy()
gensim.matutils.full2sparse()
gensim.matutils.full2sparse_clipped()
gensim.matutils.get_lapack_funcs()
gensim.matutils.hellinger()
gensim.matutils.isbow()
gensim.matutils.ismatrix()
gensim.matutils.iteritems()
gensim.matutils.itervalues()
gensim.matutils.jaccard()
gensim.matutils.kullback_leibler()
gensim.matutils.pad()
gensim.matutils.qr_destroy()
gensim.matutils.ret_normalized_vec()
gensim.matutils.scipy2sparse()
gensim.matutils.sparse2full()
gensim.matutils.triu()
gensim.matutils.triu_indices()
gensim.matutils.unitvec()
gensim.matutils.veclen()
gensim.matutils.zeros_aligned()
gensim.matutils.Dense2Corpus
gensim.matutils.MmReader
gensim.matutils.MmWriter
gensim.matutils.Scipy2Corpus
gensim.matutils.Sparse2Corpus
gensim.matutils.izip
gensim.matutils.xrange
gensim.utils
gensim.utils.any2unicode()
gensim.utils.any2utf8()
gensim.utils.check_output()
gensim.utils.chunkize()
gensim.utils.chunkize_serial()
gensim.utils.contextmanager()
gensim.utils.copytree_hardlink()
gensim.utils.deaccent()
gensim.utils.decode_htmlentities()
gensim.utils.dict_from_corpus()
gensim.utils.file_or_filename()
gensim.utils.getNS()
gensim.utils.get_max_id()
gensim.utils.get_my_ip()
gensim.utils.grouper()
gensim.utils.has_pattern()
gensim.utils.identity()
gensim.utils.is_corpus()
gensim.utils.iteritems()
gensim.utils.keep_vocab_item()
gensim.utils.lemmatize()
gensim.utils.mock_data()
gensim.utils.mock_data_row()
gensim.utils.pickle()
gensim.utils.prune_vocab()
gensim.utils.pyro_daemon()
gensim.utils.qsize()
gensim.utils.randfname()
gensim.utils.revdict()
gensim.utils.safe_unichr()
gensim.utils.simple_preprocess()
gensim.utils.smart_extension()
gensim.utils.smart_open()
gensim.utils.synchronous()
gensim.utils.to_unicode()
gensim.utils.to_utf8()
gensim.utils.tokenize()
gensim.utils.toptexts()
gensim.utils.u()
gensim.utils.unichr()
gensim.utils.unpickle()
gensim.utils.upload_chunked()
gensim.utils.wraps()
gensim.utils.ClippedCorpus
gensim.utils.FakeDict
gensim.utils.InputQueue
gensim.utils.NoCM
gensim.utils.RepeatCorpus
gensim.utils.RepeatCorpusNTimes
gensim.utils.SaveLoad
gensim.utils.SlicedCorpus
gensim.utils.xrange
gensim.corpora
gensim.corpora.BleiCorpus
gensim.corpora.Dictionary
gensim.corpora.HashDictionary
gensim.corpora.IndexedCorpus
gensim.corpora.LowCorpus
gensim.corpora.MalletCorpus
gensim.corpora.MmCorpus
gensim.corpora.ShardedCorpus
gensim.corpora.SvmLightCorpus
gensim.corpora.TextCorpus
gensim.corpora.UciCorpus
gensim.corpora.WikiCorpus
gensim.models
gensim.models.CoherenceModel
gensim.models.Doc2Vec
gensim.models.HdpModel
gensim.models.LdaModel
gensim.models.LdaMulticore
gensim.models.LogEntropyModel
gensim.models.LsiModel
gensim.models.NormModel
gensim.models.Phrases
gensim.models.RpModel
gensim.models.TfidfModel
gensim.models.VocabTransform
gensim.models.Word2Vec
gensim.parsing
gensim.parsing.preprocess_documents()
gensim.parsing.preprocess_string()
gensim.parsing.read_file()
gensim.parsing.read_files()
gensim.parsing.remove_stopwords()
gensim.parsing.split_alphanum()
gensim.parsing.stem()
gensim.parsing.stem_text()
gensim.parsing.strip_multiple_whitespaces()
gensim.parsing.strip_non_alphanum()
gensim.parsing.strip_numeric()
gensim.parsing.strip_punctuation()
gensim.parsing.strip_punctuation2()
gensim.parsing.strip_short()
gensim.parsing.strip_tags()
gensim.parsing.PorterStemmer
gensim.scripts
gensim.similarities
gensim.similarities.MatrixSimilarity
gensim.similarities.Similarity
gensim.similarities.SparseMatrixSimilarity
gensim.similarities.WmdSimilarity
gensim.summarization
gensim.summarization.keywords()
gensim.summarization.summarize()
gensim.summarization.summarize_corpus()
gensim.topic_coherence
from __future__ import division, print_function, unicode_literals from numpy import linalg as LA [docs]def unitvec(vec): return (1.0 / LA.norm(vec, ord=2)) * vec