diff --git a/CHANGELOG.md b/CHANGELOG.md index 04c81ddcd6..f0d8fca90f 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,66 @@ Changes =========== + +## Unreleased + +### :red_circle: Bug fixes + +* Fix unicode error when loading FastText vocabulary (__[@mpenkov](https://github.com/mpenkov)__, [#2390](https://github.com/RaRe-Technologies/gensim/pull/2390)) + +### :books: Tutorial and doc improvements + +* Add link to bindr (__[@rogueleaderr](https://github.com/rogueleaderr)__, [#2387](https://github.com/RaRe-Technologies/gensim/pull/2387)) + +## 3.7.1, 2019-01-31 + +### :+1: Improvements + +* NMF optimization & documentation (__[@anotherbugmaster](https://github.com/anotherbugmaster)__, [#2361](https://github.com/RaRe-Technologies/gensim/pull/2361)) +* Optimize `FastText.load_fasttext_model` (__[@mpenkov](https://github.com/mpenkov)__, [#2340](https://github.com/RaRe-Technologies/gensim/pull/2340)) +* Add warning when string is used as argument to `Doc2Vec.infer_vector` (__[@tobycheese](https://github.com/tobycheese)__, [#2347](https://github.com/RaRe-Technologies/gensim/pull/2347)) +* Fix light linting issues in `LdaSeqModel` (__[@horpto](https://github.com/horpto)__, [#2360](https://github.com/RaRe-Technologies/gensim/pull/2360)) +* Move out `process_result_queue` from cycle in `LdaMulticore` (__[@horpto](https://github.com/horpto)__, [#2358](https://github.com/RaRe-Technologies/gensim/pull/2358)) + + +### :red_circle: Bug fixes + +* Fix infinite diff in `LdaModel.do_mstep` (__[@horpto](https://github.com/horpto)__, [#2344](https://github.com/RaRe-Technologies/gensim/pull/2344)) +* Fix backward compatibility issue: loading `FastTextKeyedVectors` using `KeyedVectors` (missing attribute `compatible_hash`) (__[@menshikh-iv](https://github.com/menshikh-iv)__, [#2349](https://github.com/RaRe-Technologies/gensim/pull/2349)) +* Fix logging issue (conda-forge related) (__[@menshikh-iv](https://github.com/menshikh-iv)__, 
[#2339](https://github.com/RaRe-Technologies/gensim/pull/2339)) +* Fix `WordEmbeddingsKeyedVectors.most_similar` (__[@Witiko](https://github.com/Witiko)__, [#2356](https://github.com/RaRe-Technologies/gensim/pull/2356)) +* Fix issues of `flake8==3.7.1` (__[@horpto](https://github.com/horpto)__, [#2365](https://github.com/RaRe-Technologies/gensim/pull/2365)) + + +### :books: Tutorial and doc improvements + +* Improve `FastText` documentation (__[@mpenkov](https://github.com/mpenkov)__, [#2353](https://github.com/RaRe-Technologies/gensim/pull/2353)) +* Minor corrections and improvements in `Any*Vec` docstrings (__[@tobycheese](https://github.com/tobycheese)__, [#2345](https://github.com/RaRe-Technologies/gensim/pull/2345)) +* Fix the example code for SparseTermSimilarityMatrix (__[@Witiko](https://github.com/Witiko)__, [#2359](https://github.com/RaRe-Technologies/gensim/pull/2359)) +* Update `poincare` documentation to indicate the relation format (__[@AMR-KELEG](https://github.com/AMR-KELEG)__, [#2357](https://github.com/RaRe-Technologies/gensim/pull/2357)) + + +### :warning: Deprecations (will be removed in the next major release) + +* Remove + - `gensim.models.wrappers.fasttext` (obsoleted by the new native `gensim.models.fasttext` implementation) + - `gensim.examples` + - `gensim.nosy` + - `gensim.scripts.word2vec_standalone` + - `gensim.scripts.make_wiki_lemma` + - `gensim.scripts.make_wiki_online` + - `gensim.scripts.make_wiki_online_lemma` + - `gensim.scripts.make_wiki_online_nodebug` + - `gensim.scripts.make_wiki` (all of these obsoleted by the new native `gensim.scripts.segment_wiki` implementation) + - "deprecated" functions and attributes + +* Move + - `gensim.scripts.make_wikicorpus` ➡ `gensim.scripts.make_wiki.py` + - `gensim.summarization` ➡ `gensim.models.summarization` + - `gensim.topic_coherence` ➡ `gensim.models._coherence` + - `gensim.utils` ➡ `gensim.utils.utils` (old imports will continue to work) + - `gensim.parsing.*` ➡ 
`gensim.utils.text_utils` + + ## 3.7.0, 2019-01-18 ### :star2: New features diff --git a/ISSUE_TEMPLATE.md b/ISSUE_TEMPLATE.md index 44eaefb24f..8fa0214517 100644 --- a/ISSUE_TEMPLATE.md +++ b/ISSUE_TEMPLATE.md @@ -1,48 +1,29 @@ - - +**IMPORTANT**: -#### Description -TODO: change commented example - - -#### Steps/Code/Corpus to Reproduce - -#### Expected Results - +#### Problem description -#### Actual Results - +#### Steps/code/corpus to reproduce + +Include full tracebacks, logs and datasets if necessary. Please keep the examples minimal ("minimal reproducible example"). #### Versions - - - - - +``` diff --git a/MANIFEST.in b/MANIFEST.in index fe5947fbe2..2ad20ee9f8 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -6,6 +6,7 @@ include COPYING.LESSER include ez_setup.py include gensim/models/voidptr.h +include gensim/models/stdint_wrapper.h include gensim/models/fast_line_sentence.h include gensim/models/word2vec_inner.c diff --git a/docs/fasttext-notes.md b/docs/fasttext-notes.md deleted file mode 100644 index 5b11b7de6a..0000000000 --- a/docs/fasttext-notes.md +++ /dev/null @@ -1,152 +0,0 @@ -FastText Notes -============== - -The implementation is split across several submodules: - -- models.fasttext -- models.keyedvectors (includes FastText-specific code, not good) -- models.word2vec (superclasses) -- models.base_any2vec (superclasses) - -The implementation consists of several key classes: - -1. models.fasttext.FastTextVocab: the vocabulary -2. models.keyedvectors.FastTextKeyedVectors: the vectors -3. models.fasttext.FastTextTrainables: the underlying neural network -4. models.fasttext.FastText: ties everything together - -FastTextVocab -------------- - -Seems to be an entirely redundant class. -Inherits from models.word2vec.Word2VecVocab, adding no new functionality. - -FastTextKeyedVectors --------------------- - -Inheritance hierarchy: - -1. FastTextKeyedVectors -2. WordEmbeddingsKeyedVectors. Implements word similarity e.g. cosine similarity, WMD, etc. -3. 
BaseKeyedVectors (abstract base class) -4. utils.SaveLoad - -There are many attributes. - -Inherited from BaseKeyedVectors: - -- vectors: a 2D numpy array. Flexible number of rows (0 by default). Number of columns equals vector dimensionality. -- vocab: a dictionary. Keys are words. Items are Vocab instances: these are essentially namedtuples that contain an index and a count. The former is the index of a term in the entire vocab. The latter is the number of times the term occurs. -- vector_size (dimensionality) -- index2entity - -Inherited from WordEmbeddingsKeyedVectors: - -- vectors_norm -- index2word - -Added by FastTextKeyedVectors: - -- vectors_vocab: 2D array. Rows are vectors. Columns correspond to vector dimensions. Initialized in FastTextTrainables.init_ngrams_weights. Reset in reset_ngrams_weights. Referred to as syn0_vocab in fasttext_inner.pyx. These are vectors for every word in the vocabulary. -- vectors_vocab_norm: looks unused, see _clear_post_train method. -- vectors_ngrams: 2D array. Each row is a bucket. Columns correspond to vector dimensions. Initialized in init_ngrams_weights function. Initialized in _load_vectors method when reading from native FB binary. Modified in reset_ngrams_weights method. This is the first matrix loaded from the native binary files. -- vectors_ngrams_norm: looks unused, see _clear_post_train method. -- buckets_word: A hashmap. Keyed by the index of a term in the vocab. Each value is an array, where each element is an integer that corresponds to a bucket. Initialized in init_ngrams_weights function -- hash2index: A hashmap. Keys are hashes of ngrams. Values are the number of ngrams (?). Initialized in init_ngrams_weights function. -- min_n: minimum ngram length -- max_n: maximum ngram length -- num_ngram_vectors: initialized in the init_ngrams_weights function - -The init_ngrams_method looks like an internal method of FastTextTrainables. 
-It gets called as part of the prepare_weights method, which is effectively part of the FastModel constructor. - -The above attributes are initialized to None in the FastTextKeyedVectors class constructor. -Unfortunately, their real initialization happens in an entirely different module, models.fasttext - another indication of poor separation of concerns. - -Some questions: - -- What is the x_lockf stuff? Why is it used only by the fast C implementation? -- How are vectors_vocab and vectors_ngrams different? - -vectors_vocab contains vectors for entire vocabulary. -vectors_ngrams contains vectors for each _bucket_. - - -FastTextTrainables ------------------- - -[Link](https://radimrehurek.com/gensim/models/fasttext.html#gensim.models.fasttext.FastTextTrainables) - -This is a neural network that learns the vectors for the FastText embedding. -Mostly inherits from its [Word2Vec parent](https://radimrehurek.com/gensim/models/word2vec.html#gensim.models.word2vec.Word2VecTrainables). -Adds logic for calculating and maintaining ngram weights. - -Key attributes: - -- hashfxn: function for randomly initializing weights. Defaults to the built-in hash() -- layer1_size: The size of the inner layer of the NN. Equal to the vector dimensionality. Set in the Word2VecTrainables constructor. -- seed: The random generator seed used in reset_weights and update_weights -- syn1: The inner layer of the NN. Each row corresponds to a term in the vocabulary. Columns correspond to weights of the inner layer. There are layer1_size such weights. Set in the reset_weights and update_weights methods, only if hierarchical sampling is used. -- syn1neg: Similar to syn1, but only set if negative sampling is used. -- vectors_lockf: A one-dimensional array with one element for each term in the vocab. Set in reset_weights to an array of ones. 
-- vectors_vocab_lockf: Similar to vectors_vocab_lockf, ones(len(model.trainables.vectors), dtype=REAL) -- vectors_ngrams_lockf = ones((self.bucket, wv.vector_size), dtype=REAL) - -The lockf stuff looks like it gets used by the fast C implementation. - -The inheritance hierarchy here is: - -1. FastTextTrainables -2. Word2VecTrainables -3. utils.SaveLoad - -FastText --------- - -Inheritance hierarchy: - -1. FastText -2. BaseWordEmbeddingsModel: vocabulary management plus a ton of deprecated attrs -3. BaseAny2VecModel: logging and training functionality -4. utils.SaveLoad: for loading and saving - -Lots of attributes (many inherited from superclasses). - -From BaseAny2VecModel: - -- workers -- vector_size -- epochs -- callbacks -- batch_words -- kv -- vocabulary -- trainables - -From BaseWordEmbeddingModel: - -- alpha -- min_alpha -- min_alpha_yet_reached -- window -- random -- hs -- negative -- ns_exponent -- cbow_mean -- compute_loss -- running_training_loss -- corpus_count -- corpus_total_words -- neg_labels - -FastText attributes: - -- wv: FastTextWordVectors. Used instead of .kv - -Logging -------- - -The logging seems to be inheritance-based. -It may be better to refactor this using aggregation istead of inheritance in the future. -The benefits would be leaner classes with less responsibilities and better separation of concerns. 
diff --git a/docs/notebooks/FastText_Tutorial.ipynb b/docs/notebooks/FastText_Tutorial.ipynb index bc964b2829..ed2d4d522f 100644 --- a/docs/notebooks/FastText_Tutorial.ipynb +++ b/docs/notebooks/FastText_Tutorial.ipynb @@ -54,39 +54,31 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "Using TensorFlow backend.\n" - ] - }, { "name": "stdout", "output_type": "stream", "text": [ - "FastText(vocab=1763, size=100, alpha=0.025)\n" + "FastText(vocab=1762, size=100, alpha=0.025)\n" ] } ], "source": [ - "import gensim\n", - "import os\n", - "from gensim.models.word2vec import LineSentence\n", "from gensim.models.fasttext import FastText as FT_gensim\n", + "from gensim.test.utils import datapath\n", "\n", "# Set file names for train and test data\n", - "data_dir = '{}'.format(os.sep).join([gensim.__path__[0], 'test', 'test_data']) + os.sep\n", - "lee_train_file = data_dir + 'lee_background.cor'\n", - "lee_data = LineSentence(lee_train_file)\n", + "corpus_file = datapath('lee_background.cor')\n", "\n", "model_gensim = FT_gensim(size=100)\n", "\n", "# build the vocabulary\n", - "model_gensim.build_vocab(lee_data)\n", + "model_gensim.build_vocab(corpus_file=corpus_file)\n", "\n", "# train the model\n", - "model_gensim.train(lee_data, total_examples=model_gensim.corpus_count, epochs=model_gensim.iter)\n", + "model_gensim.train(\n", + " corpus_file=corpus_file, epochs=model_gensim.epochs,\n", + " total_examples=model_gensim.corpus_count, total_words=model_gensim.corpus_total_words\n", + ")\n", "\n", "print(model_gensim)" ] @@ -115,10 +107,10 @@ "from gensim.models.wrappers.fasttext import FastText as FT_wrapper\n", "\n", "# Set FastText home to the path to the FastText executable\n", - "ft_home = '/home/chinmaya/GSOC/Gensim/fastText/fasttext'\n", + "ft_home = '/home/misha/src/fastText-0.1.0/fasttext'\n", "\n", "# train the model\n", - "model_wrapper = FT_wrapper.train(ft_home, lee_train_file)\n", + 
"model_wrapper = FT_wrapper.train(ft_home, corpus_file)\n", "\n", "print(model_wrapper)" ] @@ -160,7 +152,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "**Note:** As in the case of Word2Vec, you can continue to train your model while using Gensim's native implementation of fastText. However, continuation of training with fastText models while using the wrapper is not supported." + "**Note:** As in the case of Word2Vec, you can continue to train your model while using Gensim's native implementation of fastText." ] }, { @@ -186,7 +178,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "FastText(vocab=1763, size=100, alpha=0.025)\n", + "FastText(vocab=1762, size=100, alpha=0.025)\n", "FastText(vocab=1763, size=100, alpha=0.025)\n" ] } @@ -231,40 +223,40 @@ "text": [ "True\n", "False\n", - "[ 0.60971916 0.66131264 0.09225323 0.28898761 0.34161603 0.06163925\n", - " -0.10147806 -0.18834428 -0.26355353 0.46417126 0.20428349 0.08414238\n", - " -0.61960417 -0.2977576 -0.22102182 0.14144184 0.13698931 -0.24608244\n", - " -0.58096874 0.3039414 0.18766184 0.38110724 0.11518024 -0.75747257\n", - " -0.275776 -0.42740449 -0.00725944 -0.24556711 0.41061676 0.05050014\n", - " -0.71367824 0.05223881 -0.07810796 0.22933683 0.43850809 0.06360656\n", - " 0.43815458 0.11096461 0.29619065 0.38061273 0.26262566 -0.07368335\n", - " 0.33198604 -0.1431711 -0.04876067 -0.35243919 0.18561274 -0.70321769\n", - " -0.16492438 -0.28362423 0.08294757 0.49758917 -0.17844993 -0.02241638\n", - " 0.18489315 0.01197879 -0.22931916 0.45774016 -0.40240806 -0.16401663\n", - " -0.07500558 0.06775728 0.14273891 0.39902335 0.1906638 0.14533612\n", - " -0.70275193 -0.64343351 -0.18003808 0.45082757 -0.42847934 0.23554228\n", - " 0.03722449 -0.0726353 -0.20106563 -0.85182953 0.16529776 0.2167791\n", - " 0.01655668 -0.45087481 0.44368106 0.94318634 0.3191022 -0.78148538\n", - " 0.06931634 -0.02454508 -0.07709292 0.00889531 0.41768485 -0.4333123\n", - " 0.57354093 0.40387386 0.50435936 
0.15307237 0.41140166 0.09306428\n", - " -0.6406759 -0.00130932 0.01818158 0.05408832]\n", - "[ 0.57120456 0.61710706 0.08425266 0.28013577 0.30789921 0.08454974\n", - " -0.05984595 -0.14644302 -0.23369177 0.42689164 0.18699257 0.09090185\n", - " -0.57885733 -0.28756606 -0.20198511 0.12675938 0.14102744 -0.22880791\n", - " -0.52516965 0.27686313 0.19865591 0.33872125 0.11230565 -0.74198454\n", - " -0.28486362 -0.40490177 -0.00606945 -0.18761727 0.40040097 0.06941447\n", - " -0.70890718 0.03646363 -0.0598574 0.19175974 0.4242314 0.05878129\n", - " 0.41432344 0.10394377 0.2668701 0.38148809 0.2761937 -0.06951485\n", - " 0.34113405 -0.12189032 -0.05861677 -0.33032765 0.16585448 -0.65862278\n", - " -0.18381383 -0.28438907 0.08867586 0.46635329 -0.18801565 -0.01610042\n", - " 0.1940661 0.03761584 -0.21442287 0.41826423 -0.38097134 -0.15111094\n", - " -0.08636253 0.07374192 0.12731727 0.40068088 0.18576843 0.13244282\n", - " -0.64814759 -0.62510144 -0.17045424 0.44949777 -0.39068545 0.19102012\n", - " 0.03177847 -0.06673145 -0.17997442 -0.81052922 0.15459165 0.21476634\n", - " -0.01961387 -0.43806009 0.40781115 0.88663652 0.29360816 -0.74157697\n", - " 0.04686275 -0.0396045 -0.06810026 0.00260469 0.40505417 -0.39977569\n", - " 0.5443192 0.38472273 0.48665705 0.12033045 0.40395209 0.10123577\n", - " -0.6243847 -0.02460667 0.00828873 0.04089492]\n" + "[ 0.8314139 0.61584824 -0.22241311 0.07523467 0.5152522 0.07724247\n", + " -0.13744526 0.05606242 -0.09502476 0.45655364 0.51096547 -0.13521144\n", + " -0.7620124 -0.4685431 -0.15228595 -0.03442579 0.20600994 -0.5080321\n", + " -0.6443741 0.605772 -0.30647403 0.41962707 0.06037483 -0.40195057\n", + " -0.11246474 -0.59829116 -0.32052496 -0.48515126 0.2997839 -0.20067295\n", + " -0.20996568 0.12522118 -0.0364657 0.62870216 0.5781912 -0.00992062\n", + " 0.51955134 -0.10997857 0.16197589 0.27111182 -0.06318171 -0.24831475\n", + " 0.09808698 -0.37751442 -0.13298641 -0.15047912 -0.01828656 -0.6400881\n", + " 0.28488973 -0.14948265 
0.18325825 0.6458386 -0.00953633 0.13587084\n", + " -0.1961209 -0.42555386 -0.19528134 0.52414805 -0.30868796 -0.5202228\n", + " -0.10896837 0.06696089 0.44607309 0.37719652 0.08233636 0.24584875\n", + " -0.80979943 -0.30543917 -0.15849951 0.16166946 -0.36826986 -0.00906481\n", + " -0.14814071 -0.25263855 -0.41303173 -0.48292273 -0.05554645 -0.00310395\n", + " 0.21415223 -0.27768075 0.7148276 1.3367277 0.33960983 -0.47452113\n", + " 0.27783358 0.09962273 0.04856196 -0.23065457 0.19847827 -0.7086235\n", + " 0.2897328 0.08882508 0.47819164 -0.10128012 0.17164136 -0.08161731\n", + " -0.64568347 -0.04466937 0.04507336 0.4807562 ]\n", + "[ 0.7486652 0.5551642 -0.20113334 0.0694495 0.46116358 0.06881845\n", + " -0.12488337 0.05208117 -0.08345503 0.41118833 0.4612766 -0.12186286\n", + " -0.68638855 -0.4214572 -0.13843313 -0.03139759 0.18622552 -0.45825756\n", + " -0.57948387 0.54435897 -0.27771378 0.3789184 0.05383135 -0.36025965\n", + " -0.10304614 -0.53994924 -0.28970715 -0.43614468 0.26968622 -0.18174443\n", + " -0.19075763 0.11169459 -0.03211116 0.5669812 0.5213458 -0.01047292\n", + " 0.4683945 -0.09853561 0.14416309 0.2458799 -0.05680516 -0.22388494\n", + " 0.08682863 -0.34187067 -0.11945734 -0.1357073 -0.0152749 -0.5779147\n", + " 0.25770664 -0.13402262 0.16518788 0.5821273 -0.00866939 0.12256315\n", + " -0.17704405 -0.38423932 -0.1755833 0.47041836 -0.27653104 -0.46991062\n", + " -0.09599836 0.05943088 0.4017819 0.33958077 0.07508487 0.22090466\n", + " -0.72955 -0.2727049 -0.14109111 0.14624386 -0.33014265 -0.00984893\n", + " -0.13071296 -0.22914156 -0.37331858 -0.43644536 -0.05077597 -0.00315402\n", + " 0.19187897 -0.2513682 0.6448789 1.2039913 0.30247915 -0.4269294\n", + " 0.25062108 0.08874664 0.04146989 -0.20783317 0.17835104 -0.6382346\n", + " 0.26064712 0.08040012 0.43090543 -0.09168535 0.15238702 -0.07426675\n", + " -0.5815522 -0.03998712 0.04137334 0.4317176 ]\n" ] } ], @@ -286,25 +278,19 @@ "cell_type": "code", "execution_count": 5, "metadata": {}, - 
"outputs": [ - { - "ename": "KeyError", - "evalue": "'all ngrams for word axe absent from model'", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mKeyError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;31m# Raises a KeyError since none of the character ngrams of the word `axe` are present in the training data\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mmodel_wrapper\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'axe'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", - "\u001b[0;32m/home/chinmaya/GSOC/Gensim/gensim/gensim/models/word2vec.pyc\u001b[0m in \u001b[0;36m__getitem__\u001b[0;34m(self, words)\u001b[0m\n\u001b[1;32m 1280\u001b[0m \u001b[0mRefer\u001b[0m \u001b[0mto\u001b[0m \u001b[0mthe\u001b[0m \u001b[0mdocumentation\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0;34m`\u001b[0m\u001b[0mgensim\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodels\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mKeyedVectors\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__getitem__\u001b[0m\u001b[0;34m`\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1281\u001b[0m \"\"\"\n\u001b[0;32m-> 1282\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mwv\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__getitem__\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mwords\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1283\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1284\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m__contains__\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mword\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - 
"\u001b[0;32m/home/chinmaya/GSOC/Gensim/gensim/gensim/models/keyedvectors.pyc\u001b[0m in \u001b[0;36m__getitem__\u001b[0;34m(self, words)\u001b[0m\n\u001b[1;32m 587\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mwords\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstring_types\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 588\u001b[0m \u001b[0;31m# allow calls like trained_model['office'], as a shorthand for trained_model[['office']]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 589\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mword_vec\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mwords\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 590\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 591\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mvstack\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mword_vec\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mword\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mword\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mwords\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m/home/chinmaya/GSOC/Gensim/gensim/gensim/models/wrappers/fasttext.pyc\u001b[0m in \u001b[0;36mword_vec\u001b[0;34m(self, word, use_norm)\u001b[0m\n\u001b[1;32m 92\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mword_vec\u001b[0m \u001b[0;34m/\u001b[0m \u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mngrams\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 93\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;31m# No ngrams of the word are present in self.ngrams\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 94\u001b[0;31m \u001b[0;32mraise\u001b[0m 
\u001b[0mKeyError\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'all ngrams for word %s absent from model'\u001b[0m \u001b[0;34m%\u001b[0m \u001b[0mword\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 95\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 96\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0minit_sims\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreplace\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mFalse\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;31mKeyError\u001b[0m: 'all ngrams for word axe absent from model'" - ] - } - ], + "outputs": [], "source": [ "# Raises a KeyError since none of the character ngrams of the word `axe` are present in the training data\n", - "model_wrapper['axe']" + "try:\n", + " model_wrapper['axe']\n", + "except KeyError:\n", + " #\n", + " # trap the error here so it does not interfere\n", + " # with the execution of the cells below\n", + " #\n", + " pass\n", + "else:\n", + " assert False, 'the above code should have raised a KeyError'" ] }, { @@ -365,7 +351,7 @@ { "data": { "text/plain": [ - "0.9988949391617723" + "0.99999416" ] }, "execution_count": 7, @@ -401,16 +387,16 @@ { "data": { "text/plain": [ - "[(u'bowler', 0.9999216198921204),\n", - " (u'flights', 0.999881386756897),\n", - " (u'dozens', 0.9998700618743896),\n", - " (u'each', 0.9998670220375061),\n", - " (u'weather', 0.9998487234115601),\n", - " (u'technology', 0.999805748462677),\n", - " (u'acting', 0.9998006820678711),\n", - " (u'dollars', 0.999785840511322),\n", - " (u'place,', 0.9997731447219849),\n", - " (u'custody', 0.9997485280036926)]" + "[('night', 0.9999646544456482),\n", + " ('flights', 0.9999643564224243),\n", + " ('rights', 0.999963641166687),\n", + " ('night.', 0.9999594688415527),\n", + " ('quarter', 0.9999569654464722),\n", + " ('night,', 0.9999566078186035),\n", + " ('hearing', 0.9999553561210632),\n", + " ('better', 
0.9999548196792603),\n", + " ('eight', 0.9999544620513916),\n", + " ('during', 0.999954342842102)]" ] }, "execution_count": 8, @@ -431,7 +417,7 @@ { "data": { "text/plain": [ - "0.99936318443348537" + "0.9999701" ] }, "execution_count": 9, @@ -451,7 +437,7 @@ { "data": { "text/plain": [ - "'dinner'" + "'cereal'" ] }, "execution_count": 10, @@ -471,16 +457,16 @@ { "data": { "text/plain": [ - "[(u'September', 0.9997114539146423),\n", - " (u'Rafter', 0.9996863007545471),\n", - " (u'New', 0.999636709690094),\n", - " (u'after', 0.9996317625045776),\n", - " (u'day', 0.9996190071105957),\n", - " (u'After', 0.9996107816696167),\n", - " (u'against', 0.9996088743209839),\n", - " (u'Robert', 0.9996023178100586),\n", - " (u'attacks', 0.9995726346969604),\n", - " (u'States', 0.9995641112327576)]" + "[('suicide', 0.9997773170471191),\n", + " ('decide', 0.9997694492340088),\n", + " ('side', 0.9997690916061401),\n", + " ('Minister', 0.9997668266296387),\n", + " ('inside', 0.9997666478157043),\n", + " ('Minister,', 0.99976646900177),\n", + " ('ministers', 0.9997649192810059),\n", + " ('Alliance', 0.9997645616531372),\n", + " ('best', 0.9997645020484924),\n", + " ('bombers', 0.9997643232345581)]" ] }, "execution_count": 11, @@ -497,242 +483,220 @@ "execution_count": 12, "metadata": {}, "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "family: 0.0% (0/2)\n", - "gram3-comparative: 0.0% (0/12)\n", - "gram4-superlative: 0.0% (0/12)\n", - "gram5-present-participle: 0.0% (0/20)\n", - "gram6-nationality-adjective: 0.0% (0/20)\n", - "gram7-past-tense: 0.0% (0/20)\n", - "gram8-plural: 0.0% (0/12)\n", - "total: 0.0% (0/98)\n" - ] - }, { "data": { "text/plain": [ - "[{'correct': [], 'incorrect': [], 'section': u'capital-common-countries'},\n", - " {'correct': [], 'incorrect': [], 'section': u'capital-world'},\n", - " {'correct': [], 'incorrect': [], 'section': u'currency'},\n", - " {'correct': [], 'incorrect': [], 'section': u'city-in-state'},\n", - " {'correct': 
[],\n", - " 'incorrect': [(u'HE', u'SHE', u'HIS', u'HER'),\n", - " (u'HIS', u'HER', u'HE', u'SHE')],\n", - " 'section': u'family'},\n", - " {'correct': [], 'incorrect': [], 'section': u'gram1-adjective-to-adverb'},\n", - " {'correct': [], 'incorrect': [], 'section': u'gram2-opposite'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'GOOD', u'BETTER', u'GREAT', u'GREATER'),\n", - " (u'GOOD', u'BETTER', u'LONG', u'LONGER'),\n", - " (u'GOOD', u'BETTER', u'LOW', u'LOWER'),\n", - " (u'GREAT', u'GREATER', u'LONG', u'LONGER'),\n", - " (u'GREAT', u'GREATER', u'LOW', u'LOWER'),\n", - " (u'GREAT', u'GREATER', u'GOOD', u'BETTER'),\n", - " (u'LONG', u'LONGER', u'LOW', u'LOWER'),\n", - " (u'LONG', u'LONGER', u'GOOD', u'BETTER'),\n", - " (u'LONG', u'LONGER', u'GREAT', u'GREATER'),\n", - " (u'LOW', u'LOWER', u'GOOD', u'BETTER'),\n", - " (u'LOW', u'LOWER', u'GREAT', u'GREATER'),\n", - " (u'LOW', u'LOWER', u'LONG', u'LONGER')],\n", - " 'section': u'gram3-comparative'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'BIG', u'BIGGEST', u'GOOD', u'BEST'),\n", - " (u'BIG', u'BIGGEST', u'GREAT', u'GREATEST'),\n", - " (u'BIG', u'BIGGEST', u'LARGE', u'LARGEST'),\n", - " (u'GOOD', u'BEST', u'GREAT', u'GREATEST'),\n", - " (u'GOOD', u'BEST', u'LARGE', u'LARGEST'),\n", - " (u'GOOD', u'BEST', u'BIG', u'BIGGEST'),\n", - " (u'GREAT', u'GREATEST', u'LARGE', u'LARGEST'),\n", - " (u'GREAT', u'GREATEST', u'BIG', u'BIGGEST'),\n", - " (u'GREAT', u'GREATEST', u'GOOD', u'BEST'),\n", - " (u'LARGE', u'LARGEST', u'BIG', u'BIGGEST'),\n", - " (u'LARGE', u'LARGEST', u'GOOD', u'BEST'),\n", - " (u'LARGE', u'LARGEST', u'GREAT', u'GREATEST')],\n", - " 'section': u'gram4-superlative'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'GO', u'GOING', u'LOOK', u'LOOKING'),\n", - " (u'GO', u'GOING', u'PLAY', u'PLAYING'),\n", - " (u'GO', u'GOING', u'RUN', u'RUNNING'),\n", - " (u'GO', u'GOING', u'SAY', u'SAYING'),\n", - " (u'LOOK', u'LOOKING', u'PLAY', u'PLAYING'),\n", - " (u'LOOK', u'LOOKING', u'RUN', 
u'RUNNING'),\n", - " (u'LOOK', u'LOOKING', u'SAY', u'SAYING'),\n", - " (u'LOOK', u'LOOKING', u'GO', u'GOING'),\n", - " (u'PLAY', u'PLAYING', u'RUN', u'RUNNING'),\n", - " (u'PLAY', u'PLAYING', u'SAY', u'SAYING'),\n", - " (u'PLAY', u'PLAYING', u'GO', u'GOING'),\n", - " (u'PLAY', u'PLAYING', u'LOOK', u'LOOKING'),\n", - " (u'RUN', u'RUNNING', u'SAY', u'SAYING'),\n", - " (u'RUN', u'RUNNING', u'GO', u'GOING'),\n", - " (u'RUN', u'RUNNING', u'LOOK', u'LOOKING'),\n", - " (u'RUN', u'RUNNING', u'PLAY', u'PLAYING'),\n", - " (u'SAY', u'SAYING', u'GO', u'GOING'),\n", - " (u'SAY', u'SAYING', u'LOOK', u'LOOKING'),\n", - " (u'SAY', u'SAYING', u'PLAY', u'PLAYING'),\n", - " (u'SAY', u'SAYING', u'RUN', u'RUNNING')],\n", - " 'section': u'gram5-present-participle'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'AUSTRALIA', u'AUSTRALIAN', u'FRANCE', u'FRENCH'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'INDIA', u'INDIAN'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'ISRAEL', u'ISRAELI'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'SWITZERLAND', u'SWISS'),\n", - " (u'FRANCE', u'FRENCH', u'INDIA', u'INDIAN'),\n", - " (u'FRANCE', u'FRENCH', u'ISRAEL', u'ISRAELI'),\n", - " (u'FRANCE', u'FRENCH', u'SWITZERLAND', u'SWISS'),\n", - " (u'FRANCE', u'FRENCH', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'INDIA', u'INDIAN', u'ISRAEL', u'ISRAELI'),\n", - " (u'INDIA', u'INDIAN', u'SWITZERLAND', u'SWISS'),\n", - " (u'INDIA', u'INDIAN', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'INDIA', u'INDIAN', u'FRANCE', u'FRENCH'),\n", - " (u'ISRAEL', u'ISRAELI', u'SWITZERLAND', u'SWISS'),\n", - " (u'ISRAEL', u'ISRAELI', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'ISRAEL', u'ISRAELI', u'FRANCE', u'FRENCH'),\n", - " (u'ISRAEL', u'ISRAELI', u'INDIA', u'INDIAN'),\n", - " (u'SWITZERLAND', u'SWISS', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'SWITZERLAND', u'SWISS', u'FRANCE', u'FRENCH'),\n", - " (u'SWITZERLAND', u'SWISS', u'INDIA', u'INDIAN'),\n", - " (u'SWITZERLAND', u'SWISS', u'ISRAEL', u'ISRAELI')],\n", - " 'section': 
u'gram6-nationality-adjective'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'GOING', u'WENT', u'PAYING', u'PAID'),\n", - " (u'GOING', u'WENT', u'PLAYING', u'PLAYED'),\n", - " (u'GOING', u'WENT', u'SAYING', u'SAID'),\n", - " (u'GOING', u'WENT', u'TAKING', u'TOOK'),\n", - " (u'PAYING', u'PAID', u'PLAYING', u'PLAYED'),\n", - " (u'PAYING', u'PAID', u'SAYING', u'SAID'),\n", - " (u'PAYING', u'PAID', u'TAKING', u'TOOK'),\n", - " (u'PAYING', u'PAID', u'GOING', u'WENT'),\n", - " (u'PLAYING', u'PLAYED', u'SAYING', u'SAID'),\n", - " (u'PLAYING', u'PLAYED', u'TAKING', u'TOOK'),\n", - " (u'PLAYING', u'PLAYED', u'GOING', u'WENT'),\n", - " (u'PLAYING', u'PLAYED', u'PAYING', u'PAID'),\n", - " (u'SAYING', u'SAID', u'TAKING', u'TOOK'),\n", - " (u'SAYING', u'SAID', u'GOING', u'WENT'),\n", - " (u'SAYING', u'SAID', u'PAYING', u'PAID'),\n", - " (u'SAYING', u'SAID', u'PLAYING', u'PLAYED'),\n", - " (u'TAKING', u'TOOK', u'GOING', u'WENT'),\n", - " (u'TAKING', u'TOOK', u'PAYING', u'PAID'),\n", - " (u'TAKING', u'TOOK', u'PLAYING', u'PLAYED'),\n", - " (u'TAKING', u'TOOK', u'SAYING', u'SAID')],\n", - " 'section': u'gram7-past-tense'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'BUILDING', u'BUILDINGS', u'CAR', u'CARS'),\n", - " (u'BUILDING', u'BUILDINGS', u'CHILD', u'CHILDREN'),\n", - " (u'BUILDING', u'BUILDINGS', u'MAN', u'MEN'),\n", - " (u'CAR', u'CARS', u'CHILD', u'CHILDREN'),\n", - " (u'CAR', u'CARS', u'MAN', u'MEN'),\n", - " (u'CAR', u'CARS', u'BUILDING', u'BUILDINGS'),\n", - " (u'CHILD', u'CHILDREN', u'MAN', u'MEN'),\n", - " (u'CHILD', u'CHILDREN', u'BUILDING', u'BUILDINGS'),\n", - " (u'CHILD', u'CHILDREN', u'CAR', u'CARS'),\n", - " (u'MAN', u'MEN', u'BUILDING', u'BUILDINGS'),\n", - " (u'MAN', u'MEN', u'CAR', u'CARS'),\n", - " (u'MAN', u'MEN', u'CHILD', u'CHILDREN')],\n", - " 'section': u'gram8-plural'},\n", - " {'correct': [], 'incorrect': [], 'section': u'gram9-plural-verbs'},\n", - " {'correct': [],\n", - " 'incorrect': [(u'HE', u'SHE', u'HIS', u'HER'),\n", - " (u'HIS', 
u'HER', u'HE', u'SHE'),\n", - " (u'GOOD', u'BETTER', u'GREAT', u'GREATER'),\n", - " (u'GOOD', u'BETTER', u'LONG', u'LONGER'),\n", - " (u'GOOD', u'BETTER', u'LOW', u'LOWER'),\n", - " (u'GREAT', u'GREATER', u'LONG', u'LONGER'),\n", - " (u'GREAT', u'GREATER', u'LOW', u'LOWER'),\n", - " (u'GREAT', u'GREATER', u'GOOD', u'BETTER'),\n", - " (u'LONG', u'LONGER', u'LOW', u'LOWER'),\n", - " (u'LONG', u'LONGER', u'GOOD', u'BETTER'),\n", - " (u'LONG', u'LONGER', u'GREAT', u'GREATER'),\n", - " (u'LOW', u'LOWER', u'GOOD', u'BETTER'),\n", - " (u'LOW', u'LOWER', u'GREAT', u'GREATER'),\n", - " (u'LOW', u'LOWER', u'LONG', u'LONGER'),\n", - " (u'BIG', u'BIGGEST', u'GOOD', u'BEST'),\n", - " (u'BIG', u'BIGGEST', u'GREAT', u'GREATEST'),\n", - " (u'BIG', u'BIGGEST', u'LARGE', u'LARGEST'),\n", - " (u'GOOD', u'BEST', u'GREAT', u'GREATEST'),\n", - " (u'GOOD', u'BEST', u'LARGE', u'LARGEST'),\n", - " (u'GOOD', u'BEST', u'BIG', u'BIGGEST'),\n", - " (u'GREAT', u'GREATEST', u'LARGE', u'LARGEST'),\n", - " (u'GREAT', u'GREATEST', u'BIG', u'BIGGEST'),\n", - " (u'GREAT', u'GREATEST', u'GOOD', u'BEST'),\n", - " (u'LARGE', u'LARGEST', u'BIG', u'BIGGEST'),\n", - " (u'LARGE', u'LARGEST', u'GOOD', u'BEST'),\n", - " (u'LARGE', u'LARGEST', u'GREAT', u'GREATEST'),\n", - " (u'GO', u'GOING', u'LOOK', u'LOOKING'),\n", - " (u'GO', u'GOING', u'PLAY', u'PLAYING'),\n", - " (u'GO', u'GOING', u'RUN', u'RUNNING'),\n", - " (u'GO', u'GOING', u'SAY', u'SAYING'),\n", - " (u'LOOK', u'LOOKING', u'PLAY', u'PLAYING'),\n", - " (u'LOOK', u'LOOKING', u'RUN', u'RUNNING'),\n", - " (u'LOOK', u'LOOKING', u'SAY', u'SAYING'),\n", - " (u'LOOK', u'LOOKING', u'GO', u'GOING'),\n", - " (u'PLAY', u'PLAYING', u'RUN', u'RUNNING'),\n", - " (u'PLAY', u'PLAYING', u'SAY', u'SAYING'),\n", - " (u'PLAY', u'PLAYING', u'GO', u'GOING'),\n", - " (u'PLAY', u'PLAYING', u'LOOK', u'LOOKING'),\n", - " (u'RUN', u'RUNNING', u'SAY', u'SAYING'),\n", - " (u'RUN', u'RUNNING', u'GO', u'GOING'),\n", - " (u'RUN', u'RUNNING', u'LOOK', u'LOOKING'),\n", - " (u'RUN', 
u'RUNNING', u'PLAY', u'PLAYING'),\n", - " (u'SAY', u'SAYING', u'GO', u'GOING'),\n", - " (u'SAY', u'SAYING', u'LOOK', u'LOOKING'),\n", - " (u'SAY', u'SAYING', u'PLAY', u'PLAYING'),\n", - " (u'SAY', u'SAYING', u'RUN', u'RUNNING'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'FRANCE', u'FRENCH'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'INDIA', u'INDIAN'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'ISRAEL', u'ISRAELI'),\n", - " (u'AUSTRALIA', u'AUSTRALIAN', u'SWITZERLAND', u'SWISS'),\n", - " (u'FRANCE', u'FRENCH', u'INDIA', u'INDIAN'),\n", - " (u'FRANCE', u'FRENCH', u'ISRAEL', u'ISRAELI'),\n", - " (u'FRANCE', u'FRENCH', u'SWITZERLAND', u'SWISS'),\n", - " (u'FRANCE', u'FRENCH', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'INDIA', u'INDIAN', u'ISRAEL', u'ISRAELI'),\n", - " (u'INDIA', u'INDIAN', u'SWITZERLAND', u'SWISS'),\n", - " (u'INDIA', u'INDIAN', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'INDIA', u'INDIAN', u'FRANCE', u'FRENCH'),\n", - " (u'ISRAEL', u'ISRAELI', u'SWITZERLAND', u'SWISS'),\n", - " (u'ISRAEL', u'ISRAELI', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'ISRAEL', u'ISRAELI', u'FRANCE', u'FRENCH'),\n", - " (u'ISRAEL', u'ISRAELI', u'INDIA', u'INDIAN'),\n", - " (u'SWITZERLAND', u'SWISS', u'AUSTRALIA', u'AUSTRALIAN'),\n", - " (u'SWITZERLAND', u'SWISS', u'FRANCE', u'FRENCH'),\n", - " (u'SWITZERLAND', u'SWISS', u'INDIA', u'INDIAN'),\n", - " (u'SWITZERLAND', u'SWISS', u'ISRAEL', u'ISRAELI'),\n", - " (u'GOING', u'WENT', u'PAYING', u'PAID'),\n", - " (u'GOING', u'WENT', u'PLAYING', u'PLAYED'),\n", - " (u'GOING', u'WENT', u'SAYING', u'SAID'),\n", - " (u'GOING', u'WENT', u'TAKING', u'TOOK'),\n", - " (u'PAYING', u'PAID', u'PLAYING', u'PLAYED'),\n", - " (u'PAYING', u'PAID', u'SAYING', u'SAID'),\n", - " (u'PAYING', u'PAID', u'TAKING', u'TOOK'),\n", - " (u'PAYING', u'PAID', u'GOING', u'WENT'),\n", - " (u'PLAYING', u'PLAYED', u'SAYING', u'SAID'),\n", - " (u'PLAYING', u'PLAYED', u'TAKING', u'TOOK'),\n", - " (u'PLAYING', u'PLAYED', u'GOING', u'WENT'),\n", - " (u'PLAYING', u'PLAYED', u'PAYING', 
u'PAID'),\n", - " (u'SAYING', u'SAID', u'TAKING', u'TOOK'),\n", - " (u'SAYING', u'SAID', u'GOING', u'WENT'),\n", - " (u'SAYING', u'SAID', u'PAYING', u'PAID'),\n", - " (u'SAYING', u'SAID', u'PLAYING', u'PLAYED'),\n", - " (u'TAKING', u'TOOK', u'GOING', u'WENT'),\n", - " (u'TAKING', u'TOOK', u'PAYING', u'PAID'),\n", - " (u'TAKING', u'TOOK', u'PLAYING', u'PLAYED'),\n", - " (u'TAKING', u'TOOK', u'SAYING', u'SAID'),\n", - " (u'BUILDING', u'BUILDINGS', u'CAR', u'CARS'),\n", - " (u'BUILDING', u'BUILDINGS', u'CHILD', u'CHILDREN'),\n", - " (u'BUILDING', u'BUILDINGS', u'MAN', u'MEN'),\n", - " (u'CAR', u'CARS', u'CHILD', u'CHILDREN'),\n", - " (u'CAR', u'CARS', u'MAN', u'MEN'),\n", - " (u'CAR', u'CARS', u'BUILDING', u'BUILDINGS'),\n", - " (u'CHILD', u'CHILDREN', u'MAN', u'MEN'),\n", - " (u'CHILD', u'CHILDREN', u'BUILDING', u'BUILDINGS'),\n", - " (u'CHILD', u'CHILDREN', u'CAR', u'CARS'),\n", - " (u'MAN', u'MEN', u'BUILDING', u'BUILDINGS'),\n", - " (u'MAN', u'MEN', u'CAR', u'CARS'),\n", - " (u'MAN', u'MEN', u'CHILD', u'CHILDREN')],\n", - " 'section': 'total'}]" + "[{'section': 'capital-common-countries', 'correct': [], 'incorrect': []},\n", + " {'section': 'capital-world', 'correct': [], 'incorrect': []},\n", + " {'section': 'currency', 'correct': [], 'incorrect': []},\n", + " {'section': 'city-in-state', 'correct': [], 'incorrect': []},\n", + " {'section': 'family',\n", + " 'correct': [],\n", + " 'incorrect': [('HE', 'SHE', 'HIS', 'HER'), ('HIS', 'HER', 'HE', 'SHE')]},\n", + " {'section': 'gram1-adjective-to-adverb', 'correct': [], 'incorrect': []},\n", + " {'section': 'gram2-opposite', 'correct': [], 'incorrect': []},\n", + " {'section': 'gram3-comparative',\n", + " 'correct': [('GREAT', 'GREATER', 'LOW', 'LOWER'),\n", + " ('LONG', 'LONGER', 'LOW', 'LOWER'),\n", + " ('LOW', 'LOWER', 'GREAT', 'GREATER')],\n", + " 'incorrect': [('GOOD', 'BETTER', 'GREAT', 'GREATER'),\n", + " ('GOOD', 'BETTER', 'LONG', 'LONGER'),\n", + " ('GOOD', 'BETTER', 'LOW', 'LOWER'),\n", + " ('GREAT', 
'GREATER', 'LONG', 'LONGER'),\n", + " ('GREAT', 'GREATER', 'GOOD', 'BETTER'),\n", + " ('LONG', 'LONGER', 'GOOD', 'BETTER'),\n", + " ('LONG', 'LONGER', 'GREAT', 'GREATER'),\n", + " ('LOW', 'LOWER', 'GOOD', 'BETTER'),\n", + " ('LOW', 'LOWER', 'LONG', 'LONGER')]},\n", + " {'section': 'gram4-superlative',\n", + " 'correct': [('GOOD', 'BEST', 'GREAT', 'GREATEST'),\n", + " ('GOOD', 'BEST', 'LARGE', 'LARGEST'),\n", + " ('GOOD', 'BEST', 'BIG', 'BIGGEST'),\n", + " ('GREAT', 'GREATEST', 'BIG', 'BIGGEST'),\n", + " ('LARGE', 'LARGEST', 'BIG', 'BIGGEST'),\n", + " ('LARGE', 'LARGEST', 'GREAT', 'GREATEST')],\n", + " 'incorrect': [('BIG', 'BIGGEST', 'GOOD', 'BEST'),\n", + " ('BIG', 'BIGGEST', 'GREAT', 'GREATEST'),\n", + " ('BIG', 'BIGGEST', 'LARGE', 'LARGEST'),\n", + " ('GREAT', 'GREATEST', 'LARGE', 'LARGEST'),\n", + " ('GREAT', 'GREATEST', 'GOOD', 'BEST'),\n", + " ('LARGE', 'LARGEST', 'GOOD', 'BEST')]},\n", + " {'section': 'gram5-present-participle',\n", + " 'correct': [('GO', 'GOING', 'LOOK', 'LOOKING'),\n", + " ('PLAY', 'PLAYING', 'SAY', 'SAYING'),\n", + " ('PLAY', 'PLAYING', 'LOOK', 'LOOKING'),\n", + " ('SAY', 'SAYING', 'LOOK', 'LOOKING'),\n", + " ('SAY', 'SAYING', 'PLAY', 'PLAYING')],\n", + " 'incorrect': [('GO', 'GOING', 'PLAY', 'PLAYING'),\n", + " ('GO', 'GOING', 'RUN', 'RUNNING'),\n", + " ('GO', 'GOING', 'SAY', 'SAYING'),\n", + " ('LOOK', 'LOOKING', 'PLAY', 'PLAYING'),\n", + " ('LOOK', 'LOOKING', 'RUN', 'RUNNING'),\n", + " ('LOOK', 'LOOKING', 'SAY', 'SAYING'),\n", + " ('LOOK', 'LOOKING', 'GO', 'GOING'),\n", + " ('PLAY', 'PLAYING', 'RUN', 'RUNNING'),\n", + " ('PLAY', 'PLAYING', 'GO', 'GOING'),\n", + " ('RUN', 'RUNNING', 'SAY', 'SAYING'),\n", + " ('RUN', 'RUNNING', 'GO', 'GOING'),\n", + " ('RUN', 'RUNNING', 'LOOK', 'LOOKING'),\n", + " ('RUN', 'RUNNING', 'PLAY', 'PLAYING'),\n", + " ('SAY', 'SAYING', 'GO', 'GOING'),\n", + " ('SAY', 'SAYING', 'RUN', 'RUNNING')]},\n", + " {'section': 'gram6-nationality-adjective',\n", + " 'correct': [('AUSTRALIA', 'AUSTRALIAN', 'INDIA', 
'INDIAN'),\n", + " ('AUSTRALIA', 'AUSTRALIAN', 'ISRAEL', 'ISRAELI'),\n", + " ('INDIA', 'INDIAN', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('ISRAEL', 'ISRAELI', 'INDIA', 'INDIAN'),\n", + " ('SWITZERLAND', 'SWISS', 'INDIA', 'INDIAN')],\n", + " 'incorrect': [('AUSTRALIA', 'AUSTRALIAN', 'FRANCE', 'FRENCH'),\n", + " ('AUSTRALIA', 'AUSTRALIAN', 'SWITZERLAND', 'SWISS'),\n", + " ('FRANCE', 'FRENCH', 'INDIA', 'INDIAN'),\n", + " ('FRANCE', 'FRENCH', 'ISRAEL', 'ISRAELI'),\n", + " ('FRANCE', 'FRENCH', 'SWITZERLAND', 'SWISS'),\n", + " ('FRANCE', 'FRENCH', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('INDIA', 'INDIAN', 'ISRAEL', 'ISRAELI'),\n", + " ('INDIA', 'INDIAN', 'SWITZERLAND', 'SWISS'),\n", + " ('INDIA', 'INDIAN', 'FRANCE', 'FRENCH'),\n", + " ('ISRAEL', 'ISRAELI', 'SWITZERLAND', 'SWISS'),\n", + " ('ISRAEL', 'ISRAELI', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('ISRAEL', 'ISRAELI', 'FRANCE', 'FRENCH'),\n", + " ('SWITZERLAND', 'SWISS', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('SWITZERLAND', 'SWISS', 'FRANCE', 'FRENCH'),\n", + " ('SWITZERLAND', 'SWISS', 'ISRAEL', 'ISRAELI')]},\n", + " {'section': 'gram7-past-tense',\n", + " 'correct': [('PAYING', 'PAID', 'SAYING', 'SAID')],\n", + " 'incorrect': [('GOING', 'WENT', 'PAYING', 'PAID'),\n", + " ('GOING', 'WENT', 'PLAYING', 'PLAYED'),\n", + " ('GOING', 'WENT', 'SAYING', 'SAID'),\n", + " ('GOING', 'WENT', 'TAKING', 'TOOK'),\n", + " ('PAYING', 'PAID', 'PLAYING', 'PLAYED'),\n", + " ('PAYING', 'PAID', 'TAKING', 'TOOK'),\n", + " ('PAYING', 'PAID', 'GOING', 'WENT'),\n", + " ('PLAYING', 'PLAYED', 'SAYING', 'SAID'),\n", + " ('PLAYING', 'PLAYED', 'TAKING', 'TOOK'),\n", + " ('PLAYING', 'PLAYED', 'GOING', 'WENT'),\n", + " ('PLAYING', 'PLAYED', 'PAYING', 'PAID'),\n", + " ('SAYING', 'SAID', 'TAKING', 'TOOK'),\n", + " ('SAYING', 'SAID', 'GOING', 'WENT'),\n", + " ('SAYING', 'SAID', 'PAYING', 'PAID'),\n", + " ('SAYING', 'SAID', 'PLAYING', 'PLAYED'),\n", + " ('TAKING', 'TOOK', 'GOING', 'WENT'),\n", + " ('TAKING', 'TOOK', 'PAYING', 'PAID'),\n", + " ('TAKING', 'TOOK', 
'PLAYING', 'PLAYED'),\n", + " ('TAKING', 'TOOK', 'SAYING', 'SAID')]},\n", + " {'section': 'gram8-plural',\n", + " 'correct': [('BUILDING', 'BUILDINGS', 'CHILD', 'CHILDREN'),\n", + " ('CHILD', 'CHILDREN', 'CAR', 'CARS'),\n", + " ('MAN', 'MEN', 'CAR', 'CARS')],\n", + " 'incorrect': [('BUILDING', 'BUILDINGS', 'CAR', 'CARS'),\n", + " ('BUILDING', 'BUILDINGS', 'MAN', 'MEN'),\n", + " ('CAR', 'CARS', 'CHILD', 'CHILDREN'),\n", + " ('CAR', 'CARS', 'MAN', 'MEN'),\n", + " ('CAR', 'CARS', 'BUILDING', 'BUILDINGS'),\n", + " ('CHILD', 'CHILDREN', 'MAN', 'MEN'),\n", + " ('CHILD', 'CHILDREN', 'BUILDING', 'BUILDINGS'),\n", + " ('MAN', 'MEN', 'BUILDING', 'BUILDINGS'),\n", + " ('MAN', 'MEN', 'CHILD', 'CHILDREN')]},\n", + " {'section': 'gram9-plural-verbs', 'correct': [], 'incorrect': []},\n", + " {'section': 'total',\n", + " 'correct': [('GREAT', 'GREATER', 'LOW', 'LOWER'),\n", + " ('LONG', 'LONGER', 'LOW', 'LOWER'),\n", + " ('LOW', 'LOWER', 'GREAT', 'GREATER'),\n", + " ('GOOD', 'BEST', 'GREAT', 'GREATEST'),\n", + " ('GOOD', 'BEST', 'LARGE', 'LARGEST'),\n", + " ('GOOD', 'BEST', 'BIG', 'BIGGEST'),\n", + " ('GREAT', 'GREATEST', 'BIG', 'BIGGEST'),\n", + " ('LARGE', 'LARGEST', 'BIG', 'BIGGEST'),\n", + " ('LARGE', 'LARGEST', 'GREAT', 'GREATEST'),\n", + " ('GO', 'GOING', 'LOOK', 'LOOKING'),\n", + " ('PLAY', 'PLAYING', 'SAY', 'SAYING'),\n", + " ('PLAY', 'PLAYING', 'LOOK', 'LOOKING'),\n", + " ('SAY', 'SAYING', 'LOOK', 'LOOKING'),\n", + " ('SAY', 'SAYING', 'PLAY', 'PLAYING'),\n", + " ('AUSTRALIA', 'AUSTRALIAN', 'INDIA', 'INDIAN'),\n", + " ('AUSTRALIA', 'AUSTRALIAN', 'ISRAEL', 'ISRAELI'),\n", + " ('INDIA', 'INDIAN', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('ISRAEL', 'ISRAELI', 'INDIA', 'INDIAN'),\n", + " ('SWITZERLAND', 'SWISS', 'INDIA', 'INDIAN'),\n", + " ('PAYING', 'PAID', 'SAYING', 'SAID'),\n", + " ('BUILDING', 'BUILDINGS', 'CHILD', 'CHILDREN'),\n", + " ('CHILD', 'CHILDREN', 'CAR', 'CARS'),\n", + " ('MAN', 'MEN', 'CAR', 'CARS')],\n", + " 'incorrect': [('HE', 'SHE', 'HIS', 'HER'),\n", + " ('HIS', 
'HER', 'HE', 'SHE'),\n", + " ('GOOD', 'BETTER', 'GREAT', 'GREATER'),\n", + " ('GOOD', 'BETTER', 'LONG', 'LONGER'),\n", + " ('GOOD', 'BETTER', 'LOW', 'LOWER'),\n", + " ('GREAT', 'GREATER', 'LONG', 'LONGER'),\n", + " ('GREAT', 'GREATER', 'GOOD', 'BETTER'),\n", + " ('LONG', 'LONGER', 'GOOD', 'BETTER'),\n", + " ('LONG', 'LONGER', 'GREAT', 'GREATER'),\n", + " ('LOW', 'LOWER', 'GOOD', 'BETTER'),\n", + " ('LOW', 'LOWER', 'LONG', 'LONGER'),\n", + " ('BIG', 'BIGGEST', 'GOOD', 'BEST'),\n", + " ('BIG', 'BIGGEST', 'GREAT', 'GREATEST'),\n", + " ('BIG', 'BIGGEST', 'LARGE', 'LARGEST'),\n", + " ('GREAT', 'GREATEST', 'LARGE', 'LARGEST'),\n", + " ('GREAT', 'GREATEST', 'GOOD', 'BEST'),\n", + " ('LARGE', 'LARGEST', 'GOOD', 'BEST'),\n", + " ('GO', 'GOING', 'PLAY', 'PLAYING'),\n", + " ('GO', 'GOING', 'RUN', 'RUNNING'),\n", + " ('GO', 'GOING', 'SAY', 'SAYING'),\n", + " ('LOOK', 'LOOKING', 'PLAY', 'PLAYING'),\n", + " ('LOOK', 'LOOKING', 'RUN', 'RUNNING'),\n", + " ('LOOK', 'LOOKING', 'SAY', 'SAYING'),\n", + " ('LOOK', 'LOOKING', 'GO', 'GOING'),\n", + " ('PLAY', 'PLAYING', 'RUN', 'RUNNING'),\n", + " ('PLAY', 'PLAYING', 'GO', 'GOING'),\n", + " ('RUN', 'RUNNING', 'SAY', 'SAYING'),\n", + " ('RUN', 'RUNNING', 'GO', 'GOING'),\n", + " ('RUN', 'RUNNING', 'LOOK', 'LOOKING'),\n", + " ('RUN', 'RUNNING', 'PLAY', 'PLAYING'),\n", + " ('SAY', 'SAYING', 'GO', 'GOING'),\n", + " ('SAY', 'SAYING', 'RUN', 'RUNNING'),\n", + " ('AUSTRALIA', 'AUSTRALIAN', 'FRANCE', 'FRENCH'),\n", + " ('AUSTRALIA', 'AUSTRALIAN', 'SWITZERLAND', 'SWISS'),\n", + " ('FRANCE', 'FRENCH', 'INDIA', 'INDIAN'),\n", + " ('FRANCE', 'FRENCH', 'ISRAEL', 'ISRAELI'),\n", + " ('FRANCE', 'FRENCH', 'SWITZERLAND', 'SWISS'),\n", + " ('FRANCE', 'FRENCH', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('INDIA', 'INDIAN', 'ISRAEL', 'ISRAELI'),\n", + " ('INDIA', 'INDIAN', 'SWITZERLAND', 'SWISS'),\n", + " ('INDIA', 'INDIAN', 'FRANCE', 'FRENCH'),\n", + " ('ISRAEL', 'ISRAELI', 'SWITZERLAND', 'SWISS'),\n", + " ('ISRAEL', 'ISRAELI', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " 
('ISRAEL', 'ISRAELI', 'FRANCE', 'FRENCH'),\n", + " ('SWITZERLAND', 'SWISS', 'AUSTRALIA', 'AUSTRALIAN'),\n", + " ('SWITZERLAND', 'SWISS', 'FRANCE', 'FRENCH'),\n", + " ('SWITZERLAND', 'SWISS', 'ISRAEL', 'ISRAELI'),\n", + " ('GOING', 'WENT', 'PAYING', 'PAID'),\n", + " ('GOING', 'WENT', 'PLAYING', 'PLAYED'),\n", + " ('GOING', 'WENT', 'SAYING', 'SAID'),\n", + " ('GOING', 'WENT', 'TAKING', 'TOOK'),\n", + " ('PAYING', 'PAID', 'PLAYING', 'PLAYED'),\n", + " ('PAYING', 'PAID', 'TAKING', 'TOOK'),\n", + " ('PAYING', 'PAID', 'GOING', 'WENT'),\n", + " ('PLAYING', 'PLAYED', 'SAYING', 'SAID'),\n", + " ('PLAYING', 'PLAYED', 'TAKING', 'TOOK'),\n", + " ('PLAYING', 'PLAYED', 'GOING', 'WENT'),\n", + " ('PLAYING', 'PLAYED', 'PAYING', 'PAID'),\n", + " ('SAYING', 'SAID', 'TAKING', 'TOOK'),\n", + " ('SAYING', 'SAID', 'GOING', 'WENT'),\n", + " ('SAYING', 'SAID', 'PAYING', 'PAID'),\n", + " ('SAYING', 'SAID', 'PLAYING', 'PLAYED'),\n", + " ('TAKING', 'TOOK', 'GOING', 'WENT'),\n", + " ('TAKING', 'TOOK', 'PAYING', 'PAID'),\n", + " ('TAKING', 'TOOK', 'PLAYING', 'PLAYED'),\n", + " ('TAKING', 'TOOK', 'SAYING', 'SAID'),\n", + " ('BUILDING', 'BUILDINGS', 'CAR', 'CARS'),\n", + " ('BUILDING', 'BUILDINGS', 'MAN', 'MEN'),\n", + " ('CAR', 'CARS', 'CHILD', 'CHILDREN'),\n", + " ('CAR', 'CARS', 'MAN', 'MEN'),\n", + " ('CAR', 'CARS', 'BUILDING', 'BUILDINGS'),\n", + " ('CHILD', 'CHILDREN', 'MAN', 'MEN'),\n", + " ('CHILD', 'CHILDREN', 'BUILDING', 'BUILDINGS'),\n", + " ('MAN', 'MEN', 'BUILDING', 'BUILDINGS'),\n", + " ('MAN', 'MEN', 'CHILD', 'CHILDREN')]}]" ] }, "execution_count": 12, @@ -741,9 +705,7 @@ } ], "source": [ - "question_file_path = data_dir + 'questions-words.txt'\n", - "\n", - "model_wrapper.accuracy(questions=question_file_path)" + "model_wrapper.accuracy(questions=datapath('questions-words.txt'))" ] }, { @@ -754,7 +716,7 @@ { "data": { "text/plain": [ - "1.1102867164706653" + "1.1245153746934533" ] }, "execution_count": 13, @@ -781,9 +743,7 @@ { "cell_type": "code", "execution_count": null, - 
"metadata": { - "collapsed": true - }, + "metadata": {}, "outputs": [], "source": [] } @@ -791,21 +751,21 @@ "metadata": { "anaconda-cloud": {}, "kernelspec": { - "display_name": "Python 2", + "display_name": "Python 3", "language": "python", - "name": "python2" + "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", - "version": 2 + "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", - "pygments_lexer": "ipython2", - "version": "2.7.13" + "pygments_lexer": "ipython3", + "version": "3.7.1" } }, "nbformat": 4, diff --git a/docs/notebooks/nmf_tutorial.ipynb b/docs/notebooks/nmf_tutorial.ipynb index 49e5f02bc3..fc9e31f111 100644 --- a/docs/notebooks/nmf_tutorial.ipynb +++ b/docs/notebooks/nmf_tutorial.ipynb @@ -26,7 +26,47 @@ "\n", "Why **Online**? Because corpora are large and RAM is limited. Online NMF can learn topics iteratively.\n", "\n", - "This particular implementation is based on [this paper](arxiv.org/abs/1604.02634)." + "This particular implementation is based on [this paper](https://arxiv.org/abs/1604.02634).\n", + "\n", + "The main attributes are the following:\n", + "\n", + "- W is a word-topic matrix\n", + "- h is a topic-document matrix\n", + "- v is an input word-document matrix\n", + "- A, B - matrices that accumulate information from every consecutive chunk. 
A = h.dot(ht), B = v.dot(ht).\n", + "\n", + "The idea of the algorithm is as follows:\n", + "\n", + "```\n", + " Initialize W, A and B matrices\n", + "\n", + " Input corpus\n", + " Split corpus into batches\n", + "\n", + " for v in batches:\n", + " infer h:\n", + " do coordinate gradient descent step to find h that minimizes (v - Wh) l2 norm\n", + "\n", + " bound h so that it is non-negative\n", + "\n", + " update A and B:\n", + " A = h.dot(ht)\n", + " B = v.dot(ht)\n", + "\n", + " update W:\n", + " do gradient descent step to find W that minimizes 0.5*trace(WtWA) - trace(WtB) l2 norm\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## What's in this tutorial?\n", + "\n", + "- Basic training example\n", + "- Comparison with alternative models (LDA and Sklearn NMF)\n", + "- Non-standard application (image decomposition)" ] }, { @@ -40,8 +80,22 @@ "cell_type": "code", "execution_count": 1, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/anotherbugmaster/.virtualenvs/gensim/lib/python3.6/importlib/_bootstrap.py:219: RuntimeWarning: numpy.dtype size changed, may indicate binary incompatibility. Expected 96, got 88\n", + " return f(*args, **kwds)\n" + ] + } + ], "source": [ + "%load_ext autoreload\n", + "%load_ext line_profiler\n", + "\n", + "%autoreload 2\n", + "\n", "import logging\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", @@ -155,11 +209,11 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:47:54,339 : INFO : adding document #0 to Dictionary(0 unique tokens: [])\n", - "2019-01-17 14:47:54,673 : INFO : built Dictionary(25279 unique tokens: ['actual', 'assum', 'babbl', 'batka', 'batkaj']...) 
from 2819 documents (total 435328 corpus positions)\n", - "2019-01-17 14:47:54,701 : INFO : discarding 18198 tokens: [('batka', 1), ('batkaj', 1), ('beatl', 1), ('ccmail', 3), ('dayton', 4), ('edu', 1785), ('inhibit', 1), ('jbatka', 1), ('line', 2748), ('organ', 2602)]...\n", - "2019-01-17 14:47:54,702 : INFO : keeping 7081 tokens which were in no less than 5 and no more than 1409 (=50.0%) documents\n", - "2019-01-17 14:47:54,712 : INFO : resulting dictionary: Dictionary(7081 unique tokens: ['actual', 'assum', 'babbl', 'burster', 'caus']...)\n" + "2019-01-31 03:18:20,423 : INFO : adding document #0 to Dictionary(0 unique tokens: [])\n", + "2019-01-31 03:18:21,151 : INFO : built Dictionary(25279 unique tokens: ['actual', 'assum', 'babbl', 'batka', 'batkaj']...) from 2819 documents (total 435328 corpus positions)\n", + "2019-01-31 03:18:21,253 : INFO : discarding 18198 tokens: [('batka', 1), ('batkaj', 1), ('beatl', 1), ('ccmail', 3), ('dayton', 4), ('edu', 1785), ('inhibit', 1), ('jbatka', 1), ('line', 2748), ('organ', 2602)]...\n", + "2019-01-31 03:18:21,255 : INFO : keeping 7081 tokens which were in no less than 5 and no more than 1409 (=50.0%) documents\n", + "2019-01-31 03:18:21,300 : INFO : resulting dictionary: Dictionary(7081 unique tokens: ['actual', 'assum', 'babbl', 'burster', 'caus']...)\n" ] } ], @@ -202,12 +256,33 @@ "\n", "The API works in the way similar to [Gensim.models.LdaModel](https://radimrehurek.com/gensim/models/ldamodel.html).\n", "\n", - "Specific parameters:\n", + "Special parameters:\n", + "\n", + "- `kappa` float, optional\n", + "\n", + " Gradient descent step size.\n", + " \n", + " Larger value makes the model train faster, but could lead to non-convergence if set too large.\n", + " \n", + " \n", + "- `w_max_iter` int, optional\n", + "\n", + " Maximum number of iterations to train W per each batch.\n", + " \n", + " \n", + "- `w_stop_condition` float, optional\n", "\n", - "- `use_r` - whether to use residuals. 
Effectively adds regularization to the model\n", - "- `kappa` - optimizer step size coefficient.\n", - "- `lambda_` - residuals coefficient. The larger it is, the less more regularized result gets.\n", - "- `sparse_coef` - internal matrices sparse coefficient. The more it is, the faster and less accurate training is." + " If error difference gets less than that, training of ``W`` stops for the current batch.\n", + " \n", + " \n", + "- `h_r_max_iter` int, optional\n", + "\n", + " Maximum number of iterations to train h per each batch.\n", + " \n", + " \n", + "- `h_r_stop_condition` float\n", + "\n", + " If error difference gets less than that, training of ``h`` stops for the current batch." ] }, { @@ -219,16 +294,16 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:47:56,086 : INFO : Loss (no outliers): 547.4249457586467\tLoss (with outliers): 547.4249457586467\n", - "2019-01-17 14:47:56,387 : INFO : Loss (no outliers): 638.2126742605573\tLoss (with outliers): 638.2126742605573\n" + "2019-01-31 03:18:22,816 : INFO : Loss: 1.0280021673693736\n", + "2019-01-31 03:18:23,067 : INFO : Loss: 0.9805869534381415\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 1.23 s, sys: 30.1 ms, total: 1.26 s\n", - "Wall time: 1.27 s\n" + "CPU times: user 795 ms, sys: 20.2 ms, total: 815 ms\n", + "Wall time: 814 ms\n" ] } ], @@ -237,15 +312,13 @@ "\n", "nmf = GensimNmf(\n", " corpus=train_corpus,\n", - " chunksize=1000,\n", " num_topics=5,\n", " id2word=dictionary,\n", + " chunksize=1000,\n", " passes=5,\n", " eval_every=10,\n", " minimum_probability=0,\n", " random_state=42,\n", - " use_r=False,\n", - " lambda_=1000,\n", " kappa=1,\n", ")" ] @@ -266,15 +339,15 @@ "data": { "text/plain": [ "[(0,\n", - " '0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*\"said\" + 0.017*\"know\" + 0.010*\"went\" + 0.010*\"sai\" + 0.010*\"like\" + 0.010*\"apart\" + 0.009*\"come\" + 0.009*\"azerbaijani\"'),\n", + " '0.017*\"armenian\" + 0.015*\"peopl\" + 
0.014*\"said\" + 0.013*\"know\" + 0.008*\"went\" + 0.008*\"sai\" + 0.007*\"like\" + 0.007*\"apart\" + 0.007*\"come\" + 0.007*\"azerbaijani\"'),\n", " (1,\n", - " '0.094*\"jpeg\" + 0.040*\"file\" + 0.039*\"gif\" + 0.033*\"imag\" + 0.030*\"color\" + 0.021*\"format\" + 0.018*\"qualiti\" + 0.016*\"convert\" + 0.016*\"compress\" + 0.016*\"version\"'),\n", + " '0.074*\"jpeg\" + 0.032*\"file\" + 0.031*\"gif\" + 0.028*\"imag\" + 0.024*\"color\" + 0.017*\"format\" + 0.014*\"qualiti\" + 0.013*\"convert\" + 0.013*\"compress\" + 0.013*\"version\"'),\n", " (2,\n", - " '0.046*\"imag\" + 0.021*\"graphic\" + 0.018*\"data\" + 0.016*\"file\" + 0.016*\"ftp\" + 0.016*\"pub\" + 0.015*\"avail\" + 0.013*\"format\" + 0.012*\"program\" + 0.012*\"packag\"'),\n", + " '0.030*\"imag\" + 0.014*\"graphic\" + 0.012*\"data\" + 0.010*\"file\" + 0.010*\"pub\" + 0.010*\"ftp\" + 0.010*\"avail\" + 0.008*\"format\" + 0.008*\"program\" + 0.008*\"packag\"'),\n", " (3,\n", - " '0.035*\"god\" + 0.029*\"atheist\" + 0.021*\"believ\" + 0.021*\"exist\" + 0.018*\"atheism\" + 0.016*\"religion\" + 0.015*\"peopl\" + 0.014*\"christian\" + 0.013*\"religi\" + 0.012*\"israel\"'),\n", + " '0.015*\"god\" + 0.012*\"atheist\" + 0.009*\"believ\" + 0.009*\"exist\" + 0.008*\"atheism\" + 0.007*\"peopl\" + 0.007*\"religion\" + 0.006*\"christian\" + 0.006*\"israel\" + 0.006*\"religi\"'),\n", " (4,\n", - " '0.044*\"space\" + 0.029*\"launch\" + 0.020*\"satellit\" + 0.013*\"orbit\" + 0.013*\"nasa\" + 0.011*\"year\" + 0.010*\"mission\" + 0.009*\"new\" + 0.009*\"commerci\" + 0.009*\"market\"')]" + " '0.028*\"space\" + 0.019*\"launch\" + 0.013*\"satellit\" + 0.009*\"orbit\" + 0.008*\"nasa\" + 0.007*\"year\" + 0.007*\"mission\" + 0.006*\"new\" + 0.006*\"commerci\" + 0.005*\"market\"')]" ] }, "execution_count": 8, @@ -290,7 +363,9 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### Coherence" + "### Coherence\n", + "\n", + "Here's a [description of what coherence 
is](http://qpleple.com/topic-coherence-to-evaluate-topic-models/). Basically it measures how often the most frequent tokens from each topic co-occur in one document." ] }, { @@ -302,13 +377,13 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:47:56,425 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n" + "2019-01-31 03:18:23,179 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n" ] }, { "data": { "text/plain": [ - "-1.7121027413685233" + "-1.7053902612634844" ] }, "execution_count": 9, @@ -328,7 +403,9 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### Perplexity" + "### Perplexity\n", + "\n", + "[Perplexity](http://qpleple.com/perplexity-to-evaluate-topic-models/) is basically a degree of uncertainty of the model, i.e. how probable it is to observe a particular set of documents." ] }, { @@ -339,7 +416,7 @@ { "data": { "text/plain": [ - "55.22863930899718" + "2501.280703411481" ] }, "execution_count": 10, @@ -357,7 +434,9 @@ "lines_to_next_cell": 2 }, "source": [ - "### Document topics inference" + "### Document topics inference\n", + "\n", + "Let's get some news and infer a topic vector." ] }, { @@ -395,12 +474,14 @@ "\"Until I meet you, then, in Upper Hell\n", "Convulsed, foaming immortal blood: farewell\" - J. 
Berryman, \"A Professor's Song\"\n", "\n", - "Topics: [(0, 0.29204189080735804), (1, 0.026352973191825578), (2, 0.36870720087404435), (3, 0.28605983002406815), (4, 0.02683810510270401)]\n" + "====================================================================================================\n", + "Topics: [(0, 0.29903293372372697), (1, 0.007751538808305081), (2, 0.41698421255575224), (3, 0.27623131491221575)]\n" ] } ], "source": [ "print(testset[0]['data'])\n", + "print('=' * 100)\n", "print(\"Topics: {}\".format(nmf[test_corpus[0]]))" ] }, @@ -408,7 +489,9 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### Word topic inference" + "### Word topic inference\n", + "\n", + "Here's an example of topic distribution inference for a token." ] }, { @@ -423,7 +506,7 @@ "output_type": "stream", "text": [ "Word: actual\n", - "Topics: [(1, 0.20201598559144582), (3, 0.7979840144085542)]\n" + "Topics: [(0, 0.04910674896578284), (1, 0.1277766177062051), (2, 0.07803764680331245), (3, 0.6584104509982174), (4, 0.08666853552648228)]\n" ] } ], @@ -440,6 +523,13 @@ "### Internal state" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Density is a fraction of non-zero elements in a matrix." 
+ ] + }, { "cell_type": "code", "execution_count": 13, @@ -448,8 +538,8 @@ }, "outputs": [], "source": [ - "def density(sparse_matrix):\n", - " return sparse_matrix.nnz / np.multiply(*sparse_matrix.shape)" + "def density(matrix):\n", + " return (matrix > 0).mean()" ] }, { @@ -463,33 +553,12 @@ "cell_type": "code", "execution_count": 14, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "<7081x5 sparse matrix of type ''\n", - "\twith 1735 stored elements in Compressed Sparse Column format>" - ] - }, - "execution_count": 14, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "nmf._W" - ] - }, - { - "cell_type": "code", - "execution_count": 15, - "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "Density: 0.04900437791272419\n" + "Density: 0.6427905663041943\n" ] } ], @@ -506,35 +575,14 @@ }, { "cell_type": "code", - "execution_count": 16, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "<5x819 sparse matrix of type ''\n", - "\twith 3593 stored elements in Compressed Sparse Row format>" - ] - }, - "execution_count": 16, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "nmf._h" - ] - }, - { - "cell_type": "code", - "execution_count": 17, + "execution_count": 15, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "Density: 0.8774114774114774\n" + "Density: 0.8424908424908425\n" ] } ], @@ -549,44 +597,6 @@ "Residuals matrix of the last batch of shape `(words, batch)`" ] }, - { - "cell_type": "code", - "execution_count": 18, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "<7081x819 sparse matrix of type ''\n", - "\twith 0 stored elements in Compressed Sparse Row format>" - ] - }, - "execution_count": 18, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "nmf._r" - ] - }, - { - "cell_type": "code", - "execution_count": 19, - "metadata": {}, - "outputs": [ - { - 
"name": "stdout", - "output_type": "stream", - "text": [ - "Density: 0.0\n" - ] - } - ], - "source": [ - "print(\"Density: {}\".format(density(nmf._r)))" - ] - }, { "cell_type": "markdown", "metadata": {}, @@ -598,23 +608,27 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Gensim NMF vs Sklearn NMF vs Gensim LDA" + "## Gensim NMF vs Sklearn NMF vs Gensim LDA\n", + "\n", + "We'll run all the models on the [20newsgroups](https://scikit-learn.org/0.19/datasets/twenty_newsgroups.html) dataset, which has texts and labels for them.\n", + "\n", + "### Metrics\n", + "\n", + "- train time: time to train a model in seconds\n", + "- coherence: coherence score (not defined for sklearn NMF). Classic metric for topic models.\n", + "- perplexity: perplexity score. Another usual TM metric\n", + "- f1: f1 on the task of news topic classification\n", + "- l2_norm: l2 matrix norm" ] }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 16, "metadata": { "lines_to_next_cell": 2 }, "outputs": [], "source": [ - "variable_params_grid = list(ParameterGrid(dict(\n", - " use_r=[False, True],\n", - " sparse_coef=[0, 3],\n", - " lambda_=[1, 10, 100]\n", - ")))\n", - "\n", "fixed_params = dict(\n", " corpus=train_corpus,\n", " chunksize=1000,\n", @@ -629,7 +643,7 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 17, "metadata": { "lines_to_next_cell": 2 }, @@ -637,7 +651,6 @@ "source": [ "def get_execution_time(func):\n", " start = time.time()\n", - "\n", " result = func()\n", "\n", " return (time.time() - start), result\n", @@ -692,14 +705,11 @@ " coherence='u_mass'\n", " ).get_coherence()\n", "\n", - " topics = model.show_topics()\n", - "\n", " model.normalize = False\n", "\n", " return dict(\n", " perplexity=perplexity,\n", " coherence=coherence,\n", - " topics=topics,\n", " l2_norm=l2_norm,\n", " f1=f1,\n", " )\n", @@ -735,9 +745,16 @@ " )" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Run the models" + ] 
+ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": 18, "metadata": { "scrolled": true }, @@ -746,184 +763,151 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:48:02,685 : INFO : using symmetric alpha at 0.2\n", - "2019-01-17 14:48:02,685 : INFO : using symmetric eta at 0.2\n", - "2019-01-17 14:48:02,687 : INFO : using serial LDA version on this node\n", - "2019-01-17 14:48:02,693 : INFO : running online (multi-pass) LDA training, 5 topics, 5 passes over the supplied corpus of 2819 documents, updating model once every 1000 documents, evaluating perplexity every 2819 documents, iterating 50x with a convergence threshold of 0.001000\n", - "2019-01-17 14:48:02,694 : INFO : PROGRESS: pass 0, at document #1000/2819\n", - "2019-01-17 14:48:03,679 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:03,684 : INFO : topic #0 (0.200): 0.006*\"com\" + 0.005*\"new\" + 0.005*\"peopl\" + 0.004*\"space\" + 0.004*\"like\" + 0.004*\"univers\" + 0.004*\"time\" + 0.004*\"nntp\" + 0.004*\"armenian\" + 0.004*\"host\"\n", - "2019-01-17 14:48:03,684 : INFO : topic #1 (0.200): 0.007*\"com\" + 0.005*\"like\" + 0.005*\"peopl\" + 0.005*\"know\" + 0.004*\"think\" + 0.004*\"time\" + 0.004*\"god\" + 0.004*\"univers\" + 0.004*\"said\" + 0.004*\"host\"\n", - "2019-01-17 14:48:03,685 : INFO : topic #2 (0.200): 0.005*\"time\" + 0.005*\"like\" + 0.005*\"com\" + 0.005*\"israel\" + 0.005*\"space\" + 0.005*\"univers\" + 0.004*\"peopl\" + 0.004*\"islam\" + 0.004*\"host\" + 0.004*\"isra\"\n", - "2019-01-17 14:48:03,686 : INFO : topic #3 (0.200): 0.008*\"com\" + 0.006*\"jpeg\" + 0.006*\"imag\" + 0.005*\"nntp\" + 0.005*\"think\" + 0.005*\"file\" + 0.005*\"host\" + 0.004*\"like\" + 0.004*\"univers\" + 0.004*\"graphic\"\n", - "2019-01-17 14:48:03,687 : INFO : topic #4 (0.200): 0.007*\"peopl\" + 0.006*\"space\" + 0.006*\"com\" + 0.005*\"armenian\" + 0.004*\"know\" + 0.004*\"nasa\" + 0.003*\"right\" + 0.003*\"like\" + 
0.003*\"point\" + 0.003*\"time\"\n", - "2019-01-17 14:48:03,687 : INFO : topic diff=1.649469, rho=1.000000\n", - "2019-01-17 14:48:03,688 : INFO : PROGRESS: pass 0, at document #2000/2819\n", - "2019-01-17 14:48:04,584 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:04,589 : INFO : topic #0 (0.200): 0.006*\"com\" + 0.006*\"space\" + 0.005*\"new\" + 0.005*\"armenian\" + 0.005*\"univers\" + 0.004*\"like\" + 0.004*\"peopl\" + 0.004*\"time\" + 0.004*\"nntp\" + 0.004*\"turkish\"\n", - "2019-01-17 14:48:04,590 : INFO : topic #1 (0.200): 0.007*\"peopl\" + 0.007*\"com\" + 0.006*\"know\" + 0.006*\"like\" + 0.006*\"think\" + 0.005*\"god\" + 0.005*\"said\" + 0.004*\"time\" + 0.004*\"thing\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:04,590 : INFO : topic #2 (0.200): 0.007*\"israel\" + 0.005*\"isra\" + 0.005*\"peopl\" + 0.005*\"islam\" + 0.005*\"like\" + 0.005*\"time\" + 0.005*\"univers\" + 0.005*\"state\" + 0.004*\"god\" + 0.004*\"know\"\n", - "2019-01-17 14:48:04,591 : INFO : topic #3 (0.200): 0.011*\"imag\" + 0.009*\"com\" + 0.007*\"file\" + 0.006*\"graphic\" + 0.005*\"program\" + 0.005*\"like\" + 0.005*\"host\" + 0.004*\"nntp\" + 0.004*\"univers\" + 0.004*\"us\"\n", - "2019-01-17 14:48:04,592 : INFO : topic #4 (0.200): 0.011*\"armenian\" + 0.009*\"peopl\" + 0.009*\"space\" + 0.005*\"know\" + 0.005*\"nasa\" + 0.004*\"com\" + 0.004*\"right\" + 0.004*\"like\" + 0.003*\"said\" + 0.003*\"armenia\"\n", - "2019-01-17 14:48:04,592 : INFO : topic diff=0.848670, rho=0.707107\n", - "2019-01-17 14:48:05,706 : INFO : -8.075 per-word bound, 269.6 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", - "2019-01-17 14:48:05,707 : INFO : PROGRESS: pass 0, at document #2819/2819\n", - "2019-01-17 14:48:06,380 : INFO : merging changes from 819 documents into a model of 2819 documents\n", - "2019-01-17 14:48:06,384 : INFO : topic #0 (0.200): 0.006*\"com\" + 0.006*\"space\" + 0.005*\"new\" + 0.005*\"turkish\" 
+ 0.005*\"bike\" + 0.005*\"univers\" + 0.004*\"year\" + 0.004*\"like\" + 0.004*\"armenian\" + 0.004*\"time\"\n", - "2019-01-17 14:48:06,386 : INFO : topic #1 (0.200): 0.009*\"com\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.006*\"think\" + 0.006*\"god\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"said\" + 0.004*\"moral\" + 0.004*\"time\"\n", - "2019-01-17 14:48:06,386 : INFO : topic #2 (0.200): 0.010*\"israel\" + 0.007*\"isra\" + 0.006*\"jew\" + 0.006*\"peopl\" + 0.005*\"state\" + 0.005*\"univers\" + 0.005*\"islam\" + 0.005*\"think\" + 0.005*\"time\" + 0.004*\"arab\"\n", - "2019-01-17 14:48:06,387 : INFO : topic #3 (0.200): 0.011*\"com\" + 0.009*\"graphic\" + 0.009*\"imag\" + 0.007*\"file\" + 0.006*\"program\" + 0.005*\"host\" + 0.005*\"nntp\" + 0.005*\"softwar\" + 0.005*\"us\" + 0.005*\"like\"\n", - "2019-01-17 14:48:06,388 : INFO : topic #4 (0.200): 0.014*\"armenian\" + 0.010*\"space\" + 0.008*\"peopl\" + 0.006*\"turkish\" + 0.005*\"launch\" + 0.004*\"nasa\" + 0.004*\"year\" + 0.004*\"turkei\" + 0.004*\"armenia\" + 0.004*\"know\"\n", - "2019-01-17 14:48:06,389 : INFO : topic diff=0.663292, rho=0.577350\n", - "2019-01-17 14:48:06,390 : INFO : PROGRESS: pass 1, at document #1000/2819\n", - "2019-01-17 14:48:07,142 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:07,147 : INFO : topic #0 (0.200): 0.007*\"com\" + 0.007*\"space\" + 0.005*\"new\" + 0.005*\"bike\" + 0.005*\"univers\" + 0.004*\"like\" + 0.004*\"turkish\" + 0.004*\"time\" + 0.004*\"year\" + 0.004*\"nntp\"\n", - "2019-01-17 14:48:07,148 : INFO : topic #1 (0.200): 0.009*\"com\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"god\" + 0.006*\"think\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"said\"\n", - "2019-01-17 14:48:07,148 : INFO : topic #2 (0.200): 0.011*\"israel\" + 0.009*\"isra\" + 0.006*\"peopl\" + 0.006*\"jew\" + 0.005*\"arab\" + 0.005*\"islam\" + 0.005*\"think\" + 0.005*\"right\" + 0.005*\"state\" + 
0.004*\"univers\"\n", - "2019-01-17 14:48:07,149 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"com\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.006*\"program\" + 0.005*\"host\" + 0.005*\"us\" + 0.005*\"jpeg\" + 0.005*\"nntp\" + 0.005*\"univers\"\n", - "2019-01-17 14:48:07,150 : INFO : topic #4 (0.200): 0.014*\"armenian\" + 0.011*\"space\" + 0.008*\"peopl\" + 0.006*\"nasa\" + 0.006*\"turkish\" + 0.005*\"launch\" + 0.004*\"year\" + 0.004*\"armenia\" + 0.004*\"said\" + 0.004*\"orbit\"\n", - "2019-01-17 14:48:07,150 : INFO : topic diff=0.431707, rho=0.455535\n", - "2019-01-17 14:48:07,151 : INFO : PROGRESS: pass 1, at document #2000/2819\n", - "2019-01-17 14:48:07,831 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:07,836 : INFO : topic #0 (0.200): 0.008*\"space\" + 0.007*\"com\" + 0.006*\"new\" + 0.005*\"bike\" + 0.005*\"univers\" + 0.004*\"like\" + 0.004*\"year\" + 0.004*\"nntp\" + 0.004*\"host\" + 0.004*\"time\"\n", - "2019-01-17 14:48:07,837 : INFO : topic #1 (0.200): 0.009*\"com\" + 0.008*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"said\"\n", - "2019-01-17 14:48:07,838 : INFO : topic #2 (0.200): 0.011*\"israel\" + 0.009*\"isra\" + 0.007*\"jew\" + 0.006*\"peopl\" + 0.006*\"arab\" + 0.006*\"islam\" + 0.005*\"state\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:07,838 : INFO : topic #3 (0.200): 0.013*\"imag\" + 0.010*\"com\" + 0.008*\"file\" + 0.008*\"graphic\" + 0.007*\"program\" + 0.005*\"us\" + 0.005*\"host\" + 0.005*\"univers\" + 0.005*\"softwar\" + 0.005*\"nntp\"\n", - "2019-01-17 14:48:07,839 : INFO : topic #4 (0.200): 0.016*\"armenian\" + 0.010*\"space\" + 0.009*\"peopl\" + 0.005*\"turkish\" + 0.005*\"said\" + 0.005*\"nasa\" + 0.005*\"know\" + 0.004*\"armenia\" + 0.004*\"year\" + 0.004*\"like\"\n", - "2019-01-17 14:48:07,840 : INFO : topic diff=0.436104, rho=0.455535\n", - 
"2019-01-17 14:48:08,814 : INFO : -7.846 per-word bound, 230.1 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", - "2019-01-17 14:48:08,815 : INFO : PROGRESS: pass 1, at document #2819/2819\n", - "2019-01-17 14:48:09,364 : INFO : merging changes from 819 documents into a model of 2819 documents\n", - "2019-01-17 14:48:09,368 : INFO : topic #0 (0.200): 0.008*\"space\" + 0.007*\"com\" + 0.006*\"bike\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"year\" + 0.004*\"like\" + 0.004*\"orbit\" + 0.004*\"dod\" + 0.004*\"host\"\n", - "2019-01-17 14:48:09,370 : INFO : topic #1 (0.200): 0.010*\"com\" + 0.008*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"said\"\n", - "2019-01-17 14:48:09,371 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.009*\"isra\" + 0.008*\"jew\" + 0.007*\"peopl\" + 0.006*\"arab\" + 0.005*\"state\" + 0.005*\"islam\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:09,374 : INFO : topic #3 (0.200): 0.011*\"imag\" + 0.010*\"com\" + 0.010*\"graphic\" + 0.008*\"file\" + 0.007*\"program\" + 0.006*\"softwar\" + 0.005*\"host\" + 0.005*\"us\" + 0.005*\"nntp\" + 0.005*\"univers\"\n", - "2019-01-17 14:48:09,374 : INFO : topic #4 (0.200): 0.017*\"armenian\" + 0.009*\"turkish\" + 0.009*\"space\" + 0.008*\"peopl\" + 0.005*\"said\" + 0.005*\"launch\" + 0.005*\"armenia\" + 0.005*\"year\" + 0.005*\"nasa\" + 0.004*\"turkei\"\n" + "2019-01-31 03:18:27,010 : INFO : using symmetric alpha at 0.2\n", + "2019-01-31 03:18:27,012 : INFO : using symmetric eta at 0.2\n", + "2019-01-31 03:18:27,018 : INFO : using serial LDA version on this node\n", + "2019-01-31 03:18:27,026 : INFO : running online (multi-pass) LDA training, 5 topics, 5 passes over the supplied corpus of 2819 documents, updating model once every 1000 documents, evaluating perplexity every 2819 documents, iterating 50x with a convergence threshold of 
0.001000\n", + "2019-01-31 03:18:27,027 : INFO : PROGRESS: pass 0, at document #1000/2819\n", + "2019-01-31 03:18:28,047 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:28,052 : INFO : topic #0 (0.200): 0.006*\"com\" + 0.005*\"new\" + 0.005*\"peopl\" + 0.004*\"space\" + 0.004*\"like\" + 0.004*\"univers\" + 0.004*\"time\" + 0.004*\"nntp\" + 0.004*\"armenian\" + 0.004*\"host\"\n", + "2019-01-31 03:18:28,053 : INFO : topic #1 (0.200): 0.007*\"com\" + 0.005*\"like\" + 0.005*\"peopl\" + 0.005*\"know\" + 0.004*\"think\" + 0.004*\"time\" + 0.004*\"god\" + 0.004*\"univers\" + 0.004*\"said\" + 0.004*\"host\"\n", + "2019-01-31 03:18:28,054 : INFO : topic #2 (0.200): 0.005*\"time\" + 0.005*\"like\" + 0.005*\"com\" + 0.005*\"israel\" + 0.005*\"space\" + 0.005*\"univers\" + 0.004*\"peopl\" + 0.004*\"islam\" + 0.004*\"host\" + 0.004*\"isra\"\n", + "2019-01-31 03:18:28,057 : INFO : topic #3 (0.200): 0.008*\"com\" + 0.006*\"jpeg\" + 0.006*\"imag\" + 0.005*\"nntp\" + 0.005*\"think\" + 0.005*\"file\" + 0.005*\"host\" + 0.004*\"like\" + 0.004*\"univers\" + 0.004*\"graphic\"\n", + "2019-01-31 03:18:28,059 : INFO : topic #4 (0.200): 0.007*\"peopl\" + 0.006*\"space\" + 0.006*\"com\" + 0.005*\"armenian\" + 0.004*\"know\" + 0.004*\"nasa\" + 0.003*\"right\" + 0.003*\"like\" + 0.003*\"point\" + 0.003*\"time\"\n", + "2019-01-31 03:18:28,060 : INFO : topic diff=1.686979, rho=1.000000\n", + "2019-01-31 03:18:28,062 : INFO : PROGRESS: pass 0, at document #2000/2819\n", + "2019-01-31 03:18:29,018 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:29,025 : INFO : topic #0 (0.200): 0.006*\"com\" + 0.006*\"space\" + 0.005*\"new\" + 0.005*\"armenian\" + 0.005*\"univers\" + 0.004*\"like\" + 0.004*\"peopl\" + 0.004*\"time\" + 0.004*\"nntp\" + 0.004*\"turkish\"\n", + "2019-01-31 03:18:29,027 : INFO : topic #1 (0.200): 0.007*\"peopl\" + 0.007*\"com\" + 0.006*\"know\" + 0.006*\"like\" + 0.006*\"think\" + 
0.005*\"god\" + 0.005*\"said\" + 0.004*\"time\" + 0.004*\"thing\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:29,028 : INFO : topic #2 (0.200): 0.007*\"israel\" + 0.005*\"isra\" + 0.005*\"peopl\" + 0.005*\"islam\" + 0.005*\"like\" + 0.005*\"time\" + 0.005*\"univers\" + 0.005*\"state\" + 0.004*\"god\" + 0.004*\"know\"\n", + "2019-01-31 03:18:29,031 : INFO : topic #3 (0.200): 0.011*\"imag\" + 0.009*\"com\" + 0.007*\"file\" + 0.006*\"graphic\" + 0.005*\"program\" + 0.005*\"like\" + 0.005*\"host\" + 0.004*\"nntp\" + 0.004*\"univers\" + 0.004*\"us\"\n", + "2019-01-31 03:18:29,034 : INFO : topic #4 (0.200): 0.011*\"armenian\" + 0.009*\"peopl\" + 0.009*\"space\" + 0.005*\"know\" + 0.005*\"nasa\" + 0.004*\"com\" + 0.004*\"right\" + 0.004*\"like\" + 0.003*\"said\" + 0.003*\"armenia\"\n", + "2019-01-31 03:18:29,035 : INFO : topic diff=0.848667, rho=0.707107\n", + "2019-01-31 03:18:30,239 : INFO : -8.075 per-word bound, 269.6 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", + "2019-01-31 03:18:30,240 : INFO : PROGRESS: pass 0, at document #2819/2819\n", + "2019-01-31 03:18:30,922 : INFO : merging changes from 819 documents into a model of 2819 documents\n", + "2019-01-31 03:18:30,927 : INFO : topic #0 (0.200): 0.006*\"com\" + 0.006*\"space\" + 0.005*\"new\" + 0.005*\"turkish\" + 0.005*\"bike\" + 0.005*\"univers\" + 0.004*\"year\" + 0.004*\"like\" + 0.004*\"armenian\" + 0.004*\"time\"\n", + "2019-01-31 03:18:30,929 : INFO : topic #1 (0.200): 0.009*\"com\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.006*\"think\" + 0.006*\"god\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"said\" + 0.004*\"moral\" + 0.004*\"time\"\n", + "2019-01-31 03:18:30,930 : INFO : topic #2 (0.200): 0.010*\"israel\" + 0.007*\"isra\" + 0.006*\"jew\" + 0.006*\"peopl\" + 0.005*\"state\" + 0.005*\"univers\" + 0.005*\"islam\" + 0.005*\"think\" + 0.005*\"time\" + 0.004*\"arab\"\n", + "2019-01-31 03:18:30,932 : INFO : topic #3 (0.200): 0.011*\"com\" + 0.009*\"graphic\" + 
0.009*\"imag\" + 0.007*\"file\" + 0.006*\"program\" + 0.005*\"host\" + 0.005*\"nntp\" + 0.005*\"softwar\" + 0.005*\"us\" + 0.005*\"like\"\n", + "2019-01-31 03:18:30,934 : INFO : topic #4 (0.200): 0.014*\"armenian\" + 0.010*\"space\" + 0.008*\"peopl\" + 0.006*\"turkish\" + 0.005*\"launch\" + 0.004*\"nasa\" + 0.004*\"year\" + 0.004*\"turkei\" + 0.004*\"armenia\" + 0.004*\"know\"\n", + "2019-01-31 03:18:30,935 : INFO : topic diff=0.663294, rho=0.577350\n", + "2019-01-31 03:18:30,939 : INFO : PROGRESS: pass 1, at document #1000/2819\n", + "2019-01-31 03:18:31,707 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:31,711 : INFO : topic #0 (0.200): 0.007*\"com\" + 0.007*\"space\" + 0.005*\"new\" + 0.005*\"bike\" + 0.005*\"univers\" + 0.004*\"like\" + 0.004*\"turkish\" + 0.004*\"time\" + 0.004*\"year\" + 0.004*\"nntp\"\n", + "2019-01-31 03:18:31,714 : INFO : topic #1 (0.200): 0.009*\"com\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"god\" + 0.006*\"think\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"said\"\n", + "2019-01-31 03:18:31,716 : INFO : topic #2 (0.200): 0.011*\"israel\" + 0.009*\"isra\" + 0.006*\"peopl\" + 0.006*\"jew\" + 0.005*\"arab\" + 0.005*\"islam\" + 0.005*\"think\" + 0.005*\"right\" + 0.005*\"state\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:31,717 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"com\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.006*\"program\" + 0.005*\"host\" + 0.005*\"us\" + 0.005*\"jpeg\" + 0.005*\"nntp\" + 0.005*\"univers\"\n", + "2019-01-31 03:18:31,718 : INFO : topic #4 (0.200): 0.014*\"armenian\" + 0.011*\"space\" + 0.008*\"peopl\" + 0.006*\"nasa\" + 0.006*\"turkish\" + 0.005*\"launch\" + 0.004*\"year\" + 0.004*\"armenia\" + 0.004*\"said\" + 0.004*\"orbit\"\n", + "2019-01-31 03:18:31,719 : INFO : topic diff=0.431708, rho=0.455535\n", + "2019-01-31 03:18:31,720 : INFO : PROGRESS: pass 1, at document #2000/2819\n", + "2019-01-31 03:18:32,621 : 
INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:32,625 : INFO : topic #0 (0.200): 0.008*\"space\" + 0.007*\"com\" + 0.006*\"new\" + 0.005*\"bike\" + 0.005*\"univers\" + 0.004*\"like\" + 0.004*\"year\" + 0.004*\"nntp\" + 0.004*\"host\" + 0.004*\"time\"\n", + "2019-01-31 03:18:32,626 : INFO : topic #1 (0.200): 0.009*\"com\" + 0.008*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"said\"\n", + "2019-01-31 03:18:32,628 : INFO : topic #2 (0.200): 0.011*\"israel\" + 0.009*\"isra\" + 0.007*\"jew\" + 0.006*\"peopl\" + 0.006*\"arab\" + 0.006*\"islam\" + 0.005*\"state\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:32,630 : INFO : topic #3 (0.200): 0.013*\"imag\" + 0.010*\"com\" + 0.008*\"file\" + 0.008*\"graphic\" + 0.007*\"program\" + 0.005*\"us\" + 0.005*\"host\" + 0.005*\"univers\" + 0.005*\"softwar\" + 0.005*\"nntp\"\n", + "2019-01-31 03:18:32,631 : INFO : topic #4 (0.200): 0.016*\"armenian\" + 0.010*\"space\" + 0.009*\"peopl\" + 0.005*\"turkish\" + 0.005*\"said\" + 0.005*\"nasa\" + 0.005*\"know\" + 0.004*\"armenia\" + 0.004*\"year\" + 0.004*\"like\"\n", + "2019-01-31 03:18:32,632 : INFO : topic diff=0.436104, rho=0.455535\n", + "2019-01-31 03:18:33,790 : INFO : -7.846 per-word bound, 230.1 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", + "2019-01-31 03:18:33,791 : INFO : PROGRESS: pass 1, at document #2819/2819\n", + "2019-01-31 03:18:34,344 : INFO : merging changes from 819 documents into a model of 2819 documents\n", + "2019-01-31 03:18:34,348 : INFO : topic #0 (0.200): 0.008*\"space\" + 0.007*\"com\" + 0.006*\"bike\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"year\" + 0.004*\"like\" + 0.004*\"orbit\" + 0.004*\"dod\" + 0.004*\"host\"\n", + "2019-01-31 03:18:34,349 : INFO : topic #1 (0.200): 0.010*\"com\" + 0.008*\"god\" + 0.007*\"peopl\" + 
0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.005*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"said\"\n", + "2019-01-31 03:18:34,351 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.009*\"isra\" + 0.008*\"jew\" + 0.007*\"peopl\" + 0.006*\"arab\" + 0.005*\"state\" + 0.005*\"islam\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:34,353 : INFO : topic #3 (0.200): 0.011*\"imag\" + 0.010*\"com\" + 0.010*\"graphic\" + 0.008*\"file\" + 0.007*\"program\" + 0.006*\"softwar\" + 0.005*\"host\" + 0.005*\"us\" + 0.005*\"nntp\" + 0.005*\"univers\"\n", + "2019-01-31 03:18:34,355 : INFO : topic #4 (0.200): 0.017*\"armenian\" + 0.009*\"turkish\" + 0.009*\"space\" + 0.008*\"peopl\" + 0.005*\"said\" + 0.005*\"launch\" + 0.005*\"armenia\" + 0.005*\"year\" + 0.005*\"nasa\" + 0.004*\"turkei\"\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:48:09,377 : INFO : topic diff=0.423402, rho=0.455535\n", - "2019-01-17 14:48:09,378 : INFO : PROGRESS: pass 2, at document #1000/2819\n", - "2019-01-17 14:48:09,997 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:10,002 : INFO : topic #0 (0.200): 0.009*\"space\" + 0.007*\"com\" + 0.006*\"bike\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"orbit\" + 0.004*\"nasa\" + 0.004*\"year\" + 0.004*\"like\" + 0.004*\"time\"\n", - "2019-01-17 14:48:10,003 : INFO : topic #1 (0.200): 0.010*\"com\" + 0.009*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.006*\"thing\" + 0.006*\"moral\" + 0.005*\"time\" + 0.005*\"atheist\"\n", - "2019-01-17 14:48:10,006 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.010*\"isra\" + 0.007*\"jew\" + 0.007*\"peopl\" + 0.006*\"arab\" + 0.006*\"islam\" + 0.005*\"right\" + 0.005*\"think\" + 0.005*\"state\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:10,007 : INFO : topic #3 (0.200): 0.013*\"imag\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.009*\"com\" + 0.007*\"program\" + 
0.006*\"us\" + 0.006*\"host\" + 0.005*\"univers\" + 0.005*\"jpeg\" + 0.005*\"nntp\"\n", - "2019-01-17 14:48:10,008 : INFO : topic #4 (0.200): 0.017*\"armenian\" + 0.009*\"turkish\" + 0.008*\"peopl\" + 0.008*\"space\" + 0.005*\"said\" + 0.005*\"nasa\" + 0.005*\"armenia\" + 0.005*\"year\" + 0.004*\"launch\" + 0.004*\"turkei\"\n", - "2019-01-17 14:48:10,008 : INFO : topic diff=0.333963, rho=0.414549\n", - "2019-01-17 14:48:10,010 : INFO : PROGRESS: pass 2, at document #2000/2819\n", - "2019-01-17 14:48:10,635 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:10,640 : INFO : topic #0 (0.200): 0.011*\"space\" + 0.008*\"com\" + 0.006*\"bike\" + 0.006*\"new\" + 0.005*\"nasa\" + 0.005*\"univers\" + 0.005*\"orbit\" + 0.004*\"year\" + 0.004*\"like\" + 0.004*\"host\"\n", - "2019-01-17 14:48:10,640 : INFO : topic #1 (0.200): 0.010*\"com\" + 0.010*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.006*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"atheist\"\n", - "2019-01-17 14:48:10,643 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.010*\"isra\" + 0.008*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"state\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:10,646 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.009*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"softwar\" + 0.005*\"host\" + 0.005*\"nntp\"\n", - "2019-01-17 14:48:10,647 : INFO : topic #4 (0.200): 0.018*\"armenian\" + 0.010*\"peopl\" + 0.008*\"turkish\" + 0.007*\"space\" + 0.006*\"said\" + 0.005*\"know\" + 0.005*\"armenia\" + 0.004*\"like\" + 0.004*\"year\" + 0.004*\"nasa\"\n", - "2019-01-17 14:48:10,647 : INFO : topic diff=0.334135, rho=0.414549\n", - "2019-01-17 14:48:11,575 : INFO : -7.786 per-word bound, 220.6 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", - "2019-01-17 
14:48:11,576 : INFO : PROGRESS: pass 2, at document #2819/2819\n", - "2019-01-17 14:48:12,086 : INFO : merging changes from 819 documents into a model of 2819 documents\n", - "2019-01-17 14:48:12,092 : INFO : topic #0 (0.200): 0.011*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"orbit\" + 0.005*\"nasa\" + 0.005*\"year\" + 0.004*\"like\" + 0.004*\"satellit\"\n", - "2019-01-17 14:48:12,093 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.010*\"god\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"believ\"\n", - "2019-01-17 14:48:12,094 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.010*\"isra\" + 0.009*\"jew\" + 0.007*\"peopl\" + 0.007*\"arab\" + 0.006*\"state\" + 0.005*\"islam\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:12,095 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"graphic\" + 0.009*\"com\" + 0.009*\"file\" + 0.007*\"program\" + 0.006*\"softwar\" + 0.006*\"us\" + 0.005*\"univers\" + 0.005*\"host\" + 0.005*\"mail\"\n", - "2019-01-17 14:48:12,096 : INFO : topic #4 (0.200): 0.018*\"armenian\" + 0.011*\"turkish\" + 0.009*\"peopl\" + 0.006*\"said\" + 0.006*\"space\" + 0.005*\"turkei\" + 0.005*\"armenia\" + 0.005*\"turk\" + 0.005*\"year\" + 0.005*\"know\"\n", - "2019-01-17 14:48:12,099 : INFO : topic diff=0.321527, rho=0.414549\n", - "2019-01-17 14:48:12,100 : INFO : PROGRESS: pass 3, at document #1000/2819\n", - "2019-01-17 14:48:12,722 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:12,727 : INFO : topic #0 (0.200): 0.012*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.006*\"orbit\" + 0.006*\"nasa\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"year\" + 0.004*\"like\" + 0.004*\"host\"\n", - "2019-01-17 14:48:12,728 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.010*\"god\" + 0.008*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"thing\" + 
0.006*\"know\" + 0.006*\"moral\" + 0.005*\"time\" + 0.005*\"atheist\"\n", - "2019-01-17 14:48:12,729 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.011*\"isra\" + 0.008*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"state\" + 0.005*\"think\" + 0.004*\"univers\"\n", - "2019-01-17 14:48:12,730 : INFO : topic #3 (0.200): 0.013*\"imag\" + 0.010*\"file\" + 0.009*\"graphic\" + 0.008*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"host\" + 0.005*\"jpeg\" + 0.005*\"softwar\"\n", - "2019-01-17 14:48:12,731 : INFO : topic #4 (0.200): 0.018*\"armenian\" + 0.010*\"turkish\" + 0.009*\"peopl\" + 0.006*\"said\" + 0.005*\"armenia\" + 0.005*\"space\" + 0.005*\"turk\" + 0.005*\"turkei\" + 0.004*\"year\" + 0.004*\"know\"\n", - "2019-01-17 14:48:12,731 : INFO : topic diff=0.255652, rho=0.382948\n", - "2019-01-17 14:48:12,732 : INFO : PROGRESS: pass 3, at document #2000/2819\n", - "2019-01-17 14:48:13,320 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:13,325 : INFO : topic #0 (0.200): 0.013*\"space\" + 0.008*\"com\" + 0.007*\"nasa\" + 0.006*\"bike\" + 0.006*\"new\" + 0.006*\"orbit\" + 0.005*\"univers\" + 0.004*\"year\" + 0.004*\"host\" + 0.004*\"nntp\"\n", - "2019-01-17 14:48:13,326 : INFO : topic #1 (0.200): 0.011*\"god\" + 0.010*\"com\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"know\" + 0.006*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.005*\"believ\"\n", - "2019-01-17 14:48:13,326 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.011*\"isra\" + 0.008*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"state\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"jewish\"\n", - "2019-01-17 14:48:13,327 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.008*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.006*\"softwar\" + 0.005*\"host\" + 0.005*\"nntp\"\n", - "2019-01-17 
14:48:13,328 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.011*\"peopl\" + 0.009*\"turkish\" + 0.007*\"said\" + 0.006*\"know\" + 0.005*\"armenia\" + 0.005*\"turk\" + 0.005*\"like\" + 0.004*\"year\" + 0.004*\"turkei\"\n", - "2019-01-17 14:48:13,328 : INFO : topic diff=0.256253, rho=0.382948\n", - "2019-01-17 14:48:14,249 : INFO : -7.754 per-word bound, 215.8 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", - "2019-01-17 14:48:14,250 : INFO : PROGRESS: pass 3, at document #2819/2819\n", - "2019-01-17 14:48:14,719 : INFO : merging changes from 819 documents into a model of 2819 documents\n", - "2019-01-17 14:48:14,724 : INFO : topic #0 (0.200): 0.013*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.006*\"nasa\" + 0.006*\"new\" + 0.005*\"orbit\" + 0.005*\"year\" + 0.005*\"univers\" + 0.005*\"launch\" + 0.004*\"like\"\n", - "2019-01-17 14:48:14,724 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.010*\"god\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"time\"\n", - "2019-01-17 14:48:14,725 : INFO : topic #2 (0.200): 0.013*\"israel\" + 0.010*\"isra\" + 0.009*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"state\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"war\"\n", - "2019-01-17 14:48:14,726 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"graphic\" + 0.009*\"file\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"softwar\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"host\" + 0.005*\"mail\"\n", - "2019-01-17 14:48:14,727 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.012*\"turkish\" + 0.010*\"peopl\" + 0.007*\"said\" + 0.006*\"turkei\" + 0.005*\"armenia\" + 0.005*\"turk\" + 0.005*\"know\" + 0.004*\"year\" + 0.004*\"like\"\n", - "2019-01-17 14:48:14,727 : INFO : topic diff=0.249831, rho=0.382948\n", - "2019-01-17 14:48:14,728 : INFO : PROGRESS: pass 4, at document #1000/2819\n", - "2019-01-17 14:48:15,289 : INFO : 
merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:15,294 : INFO : topic #0 (0.200): 0.013*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.007*\"nasa\" + 0.006*\"orbit\" + 0.005*\"new\" + 0.005*\"year\" + 0.005*\"univers\" + 0.005*\"launch\" + 0.004*\"host\"\n" + "2019-01-31 03:18:34,356 : INFO : topic diff=0.423402, rho=0.455535\n", + "2019-01-31 03:18:34,357 : INFO : PROGRESS: pass 2, at document #1000/2819\n", + "2019-01-31 03:18:35,071 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:35,075 : INFO : topic #0 (0.200): 0.009*\"space\" + 0.007*\"com\" + 0.006*\"bike\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"orbit\" + 0.004*\"nasa\" + 0.004*\"year\" + 0.004*\"like\" + 0.004*\"time\"\n", + "2019-01-31 03:18:35,076 : INFO : topic #1 (0.200): 0.010*\"com\" + 0.009*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.006*\"thing\" + 0.006*\"moral\" + 0.005*\"time\" + 0.005*\"atheist\"\n", + "2019-01-31 03:18:35,079 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.010*\"isra\" + 0.007*\"jew\" + 0.007*\"peopl\" + 0.006*\"arab\" + 0.006*\"islam\" + 0.005*\"right\" + 0.005*\"think\" + 0.005*\"state\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:35,080 : INFO : topic #3 (0.200): 0.013*\"imag\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.009*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"host\" + 0.005*\"univers\" + 0.005*\"jpeg\" + 0.005*\"nntp\"\n", + "2019-01-31 03:18:35,081 : INFO : topic #4 (0.200): 0.017*\"armenian\" + 0.009*\"turkish\" + 0.008*\"peopl\" + 0.008*\"space\" + 0.005*\"said\" + 0.005*\"nasa\" + 0.005*\"armenia\" + 0.005*\"year\" + 0.004*\"launch\" + 0.004*\"turkei\"\n", + "2019-01-31 03:18:35,082 : INFO : topic diff=0.333964, rho=0.414549\n", + "2019-01-31 03:18:35,083 : INFO : PROGRESS: pass 2, at document #2000/2819\n", + "2019-01-31 03:18:35,848 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + 
"2019-01-31 03:18:35,852 : INFO : topic #0 (0.200): 0.011*\"space\" + 0.008*\"com\" + 0.006*\"bike\" + 0.006*\"new\" + 0.005*\"nasa\" + 0.005*\"univers\" + 0.005*\"orbit\" + 0.004*\"year\" + 0.004*\"like\" + 0.004*\"host\"\n", + "2019-01-31 03:18:35,854 : INFO : topic #1 (0.200): 0.010*\"com\" + 0.010*\"god\" + 0.007*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"know\" + 0.006*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.004*\"atheist\"\n", + "2019-01-31 03:18:35,855 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.010*\"isra\" + 0.008*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"state\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:35,858 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.009*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"softwar\" + 0.005*\"host\" + 0.005*\"nntp\"\n", + "2019-01-31 03:18:35,859 : INFO : topic #4 (0.200): 0.018*\"armenian\" + 0.010*\"peopl\" + 0.008*\"turkish\" + 0.007*\"space\" + 0.006*\"said\" + 0.005*\"know\" + 0.005*\"armenia\" + 0.004*\"like\" + 0.004*\"year\" + 0.004*\"nasa\"\n", + "2019-01-31 03:18:35,861 : INFO : topic diff=0.334136, rho=0.414549\n", + "2019-01-31 03:18:36,922 : INFO : -7.786 per-word bound, 220.6 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", + "2019-01-31 03:18:36,923 : INFO : PROGRESS: pass 2, at document #2819/2819\n", + "2019-01-31 03:18:37,532 : INFO : merging changes from 819 documents into a model of 2819 documents\n", + "2019-01-31 03:18:37,536 : INFO : topic #0 (0.200): 0.011*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"orbit\" + 0.005*\"nasa\" + 0.005*\"year\" + 0.004*\"like\" + 0.004*\"satellit\"\n", + "2019-01-31 03:18:37,537 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.010*\"god\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 
0.005*\"moral\" + 0.005*\"time\" + 0.004*\"believ\"\n", + "2019-01-31 03:18:37,539 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.010*\"isra\" + 0.009*\"jew\" + 0.007*\"peopl\" + 0.007*\"arab\" + 0.006*\"state\" + 0.005*\"islam\" + 0.005*\"right\" + 0.005*\"think\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:37,542 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"graphic\" + 0.009*\"com\" + 0.009*\"file\" + 0.007*\"program\" + 0.006*\"softwar\" + 0.006*\"us\" + 0.005*\"univers\" + 0.005*\"host\" + 0.005*\"mail\"\n", + "2019-01-31 03:18:37,544 : INFO : topic #4 (0.200): 0.018*\"armenian\" + 0.011*\"turkish\" + 0.009*\"peopl\" + 0.006*\"said\" + 0.006*\"space\" + 0.005*\"turkei\" + 0.005*\"armenia\" + 0.005*\"turk\" + 0.005*\"year\" + 0.005*\"know\"\n", + "2019-01-31 03:18:37,544 : INFO : topic diff=0.321527, rho=0.414549\n", + "2019-01-31 03:18:37,546 : INFO : PROGRESS: pass 3, at document #1000/2819\n", + "2019-01-31 03:18:38,269 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:38,274 : INFO : topic #0 (0.200): 0.012*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.006*\"orbit\" + 0.006*\"nasa\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"year\" + 0.004*\"like\" + 0.004*\"host\"\n", + "2019-01-31 03:18:38,276 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.010*\"god\" + 0.008*\"peopl\" + 0.007*\"like\" + 0.007*\"think\" + 0.006*\"thing\" + 0.006*\"know\" + 0.006*\"moral\" + 0.005*\"time\" + 0.005*\"atheist\"\n", + "2019-01-31 03:18:38,277 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.011*\"isra\" + 0.008*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"state\" + 0.005*\"think\" + 0.004*\"univers\"\n", + "2019-01-31 03:18:38,279 : INFO : topic #3 (0.200): 0.013*\"imag\" + 0.010*\"file\" + 0.009*\"graphic\" + 0.008*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"host\" + 0.005*\"jpeg\" + 0.005*\"softwar\"\n", + "2019-01-31 03:18:38,281 : INFO : topic 
#4 (0.200): 0.018*\"armenian\" + 0.010*\"turkish\" + 0.009*\"peopl\" + 0.006*\"said\" + 0.005*\"armenia\" + 0.005*\"space\" + 0.005*\"turk\" + 0.005*\"turkei\" + 0.004*\"year\" + 0.004*\"know\"\n", + "2019-01-31 03:18:38,289 : INFO : topic diff=0.255652, rho=0.382948\n", + "2019-01-31 03:18:38,291 : INFO : PROGRESS: pass 3, at document #2000/2819\n", + "2019-01-31 03:18:39,204 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:39,209 : INFO : topic #0 (0.200): 0.013*\"space\" + 0.008*\"com\" + 0.007*\"nasa\" + 0.006*\"bike\" + 0.006*\"new\" + 0.006*\"orbit\" + 0.005*\"univers\" + 0.004*\"year\" + 0.004*\"host\" + 0.004*\"nntp\"\n", + "2019-01-31 03:18:39,211 : INFO : topic #1 (0.200): 0.011*\"god\" + 0.010*\"com\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"know\" + 0.006*\"thing\" + 0.005*\"moral\" + 0.005*\"time\" + 0.005*\"believ\"\n", + "2019-01-31 03:18:39,213 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.011*\"isra\" + 0.008*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"state\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"jewish\"\n", + "2019-01-31 03:18:39,219 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.009*\"file\" + 0.009*\"graphic\" + 0.008*\"com\" + 0.007*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.006*\"softwar\" + 0.005*\"host\" + 0.005*\"nntp\"\n", + "2019-01-31 03:18:39,220 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.011*\"peopl\" + 0.009*\"turkish\" + 0.007*\"said\" + 0.006*\"know\" + 0.005*\"armenia\" + 0.005*\"turk\" + 0.005*\"like\" + 0.004*\"year\" + 0.004*\"turkei\"\n", + "2019-01-31 03:18:39,222 : INFO : topic diff=0.256253, rho=0.382948\n", + "2019-01-31 03:18:40,239 : INFO : -7.754 per-word bound, 215.8 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", + "2019-01-31 03:18:40,240 : INFO : PROGRESS: pass 3, at document #2819/2819\n", + "2019-01-31 03:18:40,808 : INFO : merging changes from 819 
documents into a model of 2819 documents\n", + "2019-01-31 03:18:40,815 : INFO : topic #0 (0.200): 0.013*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.006*\"nasa\" + 0.006*\"new\" + 0.005*\"orbit\" + 0.005*\"year\" + 0.005*\"univers\" + 0.005*\"launch\" + 0.004*\"like\"\n", + "2019-01-31 03:18:40,822 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.010*\"god\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"time\"\n", + "2019-01-31 03:18:40,831 : INFO : topic #2 (0.200): 0.013*\"israel\" + 0.010*\"isra\" + 0.009*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"state\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"war\"\n", + "2019-01-31 03:18:40,835 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"graphic\" + 0.009*\"file\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"softwar\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"host\" + 0.005*\"mail\"\n", + "2019-01-31 03:18:40,839 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.012*\"turkish\" + 0.010*\"peopl\" + 0.007*\"said\" + 0.006*\"turkei\" + 0.005*\"armenia\" + 0.005*\"turk\" + 0.005*\"know\" + 0.004*\"year\" + 0.004*\"like\"\n", + "2019-01-31 03:18:40,841 : INFO : topic diff=0.249832, rho=0.382948\n", + "2019-01-31 03:18:40,846 : INFO : PROGRESS: pass 4, at document #1000/2819\n", + "2019-01-31 03:18:41,534 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:41,539 : INFO : topic #0 (0.200): 0.013*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.007*\"nasa\" + 0.006*\"orbit\" + 0.005*\"new\" + 0.005*\"year\" + 0.005*\"univers\" + 0.005*\"launch\" + 0.004*\"host\"\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:48:15,295 : INFO : topic #1 (0.200): 0.011*\"com\" + 0.011*\"god\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.006*\"moral\" + 0.005*\"atheist\" + 0.005*\"time\"\n", - 
"2019-01-17 14:48:15,296 : INFO : topic #2 (0.200): 0.013*\"israel\" + 0.011*\"isra\" + 0.009*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"state\" + 0.005*\"think\" + 0.004*\"peac\"\n", - "2019-01-17 14:48:15,296 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.010*\"file\" + 0.010*\"graphic\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"softwar\" + 0.005*\"host\" + 0.005*\"jpeg\"\n", - "2019-01-17 14:48:15,297 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.011*\"turkish\" + 0.010*\"peopl\" + 0.006*\"said\" + 0.006*\"armenia\" + 0.006*\"turk\" + 0.005*\"turkei\" + 0.005*\"know\" + 0.004*\"greek\" + 0.004*\"year\"\n", - "2019-01-17 14:48:15,297 : INFO : topic diff=0.204473, rho=0.357622\n", - "2019-01-17 14:48:15,298 : INFO : PROGRESS: pass 4, at document #2000/2819\n", - "2019-01-17 14:48:15,860 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", - "2019-01-17 14:48:15,865 : INFO : topic #0 (0.200): 0.014*\"space\" + 0.008*\"com\" + 0.008*\"nasa\" + 0.007*\"bike\" + 0.006*\"orbit\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"year\" + 0.004*\"host\" + 0.004*\"nntp\"\n", - "2019-01-17 14:48:15,865 : INFO : topic #1 (0.200): 0.011*\"god\" + 0.010*\"com\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"atheist\"\n", - "2019-01-17 14:48:15,868 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.011*\"isra\" + 0.009*\"jew\" + 0.008*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"right\" + 0.006*\"state\" + 0.005*\"think\" + 0.004*\"jewish\"\n", - "2019-01-17 14:48:15,869 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.010*\"file\" + 0.009*\"graphic\" + 0.008*\"program\" + 0.007*\"com\" + 0.006*\"univers\" + 0.006*\"us\" + 0.006*\"softwar\" + 0.005*\"host\" + 0.005*\"need\"\n", - "2019-01-17 14:48:15,870 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.011*\"peopl\" + 
0.010*\"turkish\" + 0.007*\"said\" + 0.006*\"know\" + 0.006*\"armenia\" + 0.005*\"turk\" + 0.005*\"like\" + 0.005*\"turkei\" + 0.004*\"time\"\n", - "2019-01-17 14:48:15,870 : INFO : topic diff=0.206188, rho=0.357622\n", - "2019-01-17 14:48:16,764 : INFO : -7.735 per-word bound, 213.0 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", - "2019-01-17 14:48:16,765 : INFO : PROGRESS: pass 4, at document #2819/2819\n", - "2019-01-17 14:48:17,216 : INFO : merging changes from 819 documents into a model of 2819 documents\n", - "2019-01-17 14:48:17,221 : INFO : topic #0 (0.200): 0.014*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.007*\"nasa\" + 0.005*\"new\" + 0.005*\"orbit\" + 0.005*\"launch\" + 0.005*\"year\" + 0.005*\"univers\" + 0.004*\"like\"\n", - "2019-01-17 14:48:17,222 : INFO : topic #1 (0.200): 0.011*\"god\" + 0.011*\"com\" + 0.008*\"peopl\" + 0.008*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"time\"\n", - "2019-01-17 14:48:17,223 : INFO : topic #2 (0.200): 0.013*\"israel\" + 0.011*\"isra\" + 0.010*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"state\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"jewish\"\n", - "2019-01-17 14:48:17,224 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"graphic\" + 0.010*\"file\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"softwar\" + 0.006*\"univers\" + 0.006*\"us\" + 0.005*\"mail\" + 0.005*\"host\"\n", - "2019-01-17 14:48:17,224 : INFO : topic #4 (0.200): 0.020*\"armenian\" + 0.012*\"turkish\" + 0.010*\"peopl\" + 0.007*\"said\" + 0.006*\"turkei\" + 0.006*\"armenia\" + 0.006*\"turk\" + 0.005*\"know\" + 0.004*\"greek\" + 0.004*\"year\"\n", - "2019-01-17 14:48:17,225 : INFO : topic diff=0.203500, rho=0.357622\n", - "2019-01-17 14:48:21,544 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:48:31,057 : INFO : Loss (no outliers): 543.9085511209285\tLoss (with outliers): 
543.9085511209285\n", - "2019-01-17 14:48:31,780 : INFO : Loss (no outliers): 629.7446210861123\tLoss (with outliers): 629.7446210861123\n", - "2019-01-17 14:48:50,245 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:49:03,569 : INFO : Loss (no outliers): 677.513414250545\tLoss (with outliers): 279.46611421992964\n", - "2019-01-17 14:49:10,097 : INFO : Loss (no outliers): 669.590857352226\tLoss (with outliers): 259.2467646189499\n", - "2019-01-17 14:49:39,601 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:49:40,561 : INFO : Loss (no outliers): 547.4249457586467\tLoss (with outliers): 547.4249457586467\n", - "2019-01-17 14:49:40,838 : INFO : Loss (no outliers): 638.2126742605573\tLoss (with outliers): 638.2126742605573\n", - "2019-01-17 14:49:54,607 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:49:57,634 : INFO : Loss (no outliers): 692.6547711302494\tLoss (with outliers): 287.76899186681857\n", - "2019-01-17 14:49:58,233 : INFO : Loss (no outliers): 695.4958681211045\tLoss (with outliers): 268.2945499450434\n", - "2019-01-17 14:50:21,411 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:50:22,980 : INFO : Loss (no outliers): 543.9085511209285\tLoss (with outliers): 543.9085511209285\n", - "2019-01-17 14:50:23,716 : INFO : Loss (no outliers): 629.7446210861123\tLoss (with outliers): 629.7446210861123\n", - "2019-01-17 14:50:42,308 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:50:56,452 : INFO : Loss (no outliers): 639.6176167237056\tLoss (with outliers): 511.0048240200623\n", - "2019-01-17 14:51:03,333 : INFO : Loss (no outliers): 637.4050783690045\tLoss (with outliers): 498.7006582634081\n", - "2019-01-17 14:51:33,575 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:51:34,425 : INFO : Loss (no outliers): 547.4249457586467\tLoss (with 
outliers): 547.4249457586467\n", - "2019-01-17 14:51:34,696 : INFO : Loss (no outliers): 638.2126742605573\tLoss (with outliers): 638.2126742605573\n", - "2019-01-17 14:51:48,503 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:51:51,998 : INFO : Loss (no outliers): 651.3812921172465\tLoss (with outliers): 518.2309924866902\n", - "2019-01-17 14:51:53,008 : INFO : Loss (no outliers): 647.9339449245117\tLoss (with outliers): 509.82049860049364\n", - "2019-01-17 14:52:14,849 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:52:16,415 : INFO : Loss (no outliers): 543.9085511209285\tLoss (with outliers): 543.9085511209285\n", - "2019-01-17 14:52:17,127 : INFO : Loss (no outliers): 629.7446210861123\tLoss (with outliers): 629.7446210861123\n", - "2019-01-17 14:52:35,545 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:52:54,059 : INFO : Loss (no outliers): 542.2256187627806\tLoss (with outliers): 542.2256187627806\n", - "2019-01-17 14:53:03,433 : INFO : Loss (no outliers): 624.7035238321835\tLoss (with outliers): 624.6056240734391\n", - "2019-01-17 14:53:30,678 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:53:31,653 : INFO : Loss (no outliers): 547.4249457586467\tLoss (with outliers): 547.4249457586467\n", - "2019-01-17 14:53:31,927 : INFO : Loss (no outliers): 638.2126742605573\tLoss (with outliers): 638.2126742605573\n", - "2019-01-17 14:53:45,702 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-17 14:53:50,458 : INFO : Loss (no outliers): 547.1203901181682\tLoss (with outliers): 547.1203901181682\n", - "2019-01-17 14:53:51,589 : INFO : Loss (no outliers): 633.6243596382214\tLoss (with outliers): 633.3634284766107\n", - "2019-01-17 14:54:12,967 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n" + "2019-01-31 03:18:41,542 : INFO : topic #1 (0.200): 0.011*\"com\" + 
0.011*\"god\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.006*\"moral\" + 0.005*\"atheist\" + 0.005*\"time\"\n", + "2019-01-31 03:18:41,543 : INFO : topic #2 (0.200): 0.013*\"israel\" + 0.011*\"isra\" + 0.009*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"state\" + 0.005*\"think\" + 0.004*\"peac\"\n", + "2019-01-31 03:18:41,546 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.010*\"file\" + 0.010*\"graphic\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"us\" + 0.006*\"univers\" + 0.005*\"softwar\" + 0.005*\"host\" + 0.005*\"jpeg\"\n", + "2019-01-31 03:18:41,548 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.011*\"turkish\" + 0.010*\"peopl\" + 0.006*\"said\" + 0.006*\"armenia\" + 0.006*\"turk\" + 0.005*\"turkei\" + 0.005*\"know\" + 0.004*\"greek\" + 0.004*\"year\"\n", + "2019-01-31 03:18:41,549 : INFO : topic diff=0.204471, rho=0.357622\n", + "2019-01-31 03:18:41,551 : INFO : PROGRESS: pass 4, at document #2000/2819\n", + "2019-01-31 03:18:42,187 : INFO : merging changes from 1000 documents into a model of 2819 documents\n", + "2019-01-31 03:18:42,191 : INFO : topic #0 (0.200): 0.014*\"space\" + 0.008*\"com\" + 0.008*\"nasa\" + 0.007*\"bike\" + 0.006*\"orbit\" + 0.006*\"new\" + 0.005*\"univers\" + 0.005*\"year\" + 0.004*\"host\" + 0.004*\"nntp\"\n", + "2019-01-31 03:18:42,195 : INFO : topic #1 (0.200): 0.011*\"god\" + 0.010*\"com\" + 0.008*\"peopl\" + 0.007*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"atheist\"\n", + "2019-01-31 03:18:42,197 : INFO : topic #2 (0.200): 0.012*\"israel\" + 0.011*\"isra\" + 0.009*\"jew\" + 0.008*\"arab\" + 0.007*\"peopl\" + 0.006*\"islam\" + 0.006*\"right\" + 0.006*\"state\" + 0.005*\"think\" + 0.004*\"jewish\"\n", + "2019-01-31 03:18:42,199 : INFO : topic #3 (0.200): 0.014*\"imag\" + 0.010*\"file\" + 0.009*\"graphic\" + 0.008*\"program\" + 0.007*\"com\" + 0.006*\"univers\" + 
0.006*\"us\" + 0.006*\"softwar\" + 0.005*\"host\" + 0.005*\"need\"\n", + "2019-01-31 03:18:42,201 : INFO : topic #4 (0.200): 0.019*\"armenian\" + 0.011*\"peopl\" + 0.010*\"turkish\" + 0.007*\"said\" + 0.006*\"know\" + 0.006*\"armenia\" + 0.005*\"turk\" + 0.005*\"like\" + 0.005*\"turkei\" + 0.004*\"time\"\n", + "2019-01-31 03:18:42,203 : INFO : topic diff=0.206189, rho=0.357622\n", + "2019-01-31 03:18:43,176 : INFO : -7.735 per-word bound, 213.0 perplexity estimate based on a held-out corpus of 819 documents with 113268 words\n", + "2019-01-31 03:18:43,177 : INFO : PROGRESS: pass 4, at document #2819/2819\n", + "2019-01-31 03:18:43,789 : INFO : merging changes from 819 documents into a model of 2819 documents\n", + "2019-01-31 03:18:43,794 : INFO : topic #0 (0.200): 0.014*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.007*\"nasa\" + 0.005*\"new\" + 0.005*\"orbit\" + 0.005*\"launch\" + 0.005*\"year\" + 0.005*\"univers\" + 0.004*\"like\"\n", + "2019-01-31 03:18:43,795 : INFO : topic #1 (0.200): 0.011*\"god\" + 0.011*\"com\" + 0.008*\"peopl\" + 0.008*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"time\"\n", + "2019-01-31 03:18:43,796 : INFO : topic #2 (0.200): 0.013*\"israel\" + 0.011*\"isra\" + 0.010*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"state\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"jewish\"\n", + "2019-01-31 03:18:43,798 : INFO : topic #3 (0.200): 0.012*\"imag\" + 0.010*\"graphic\" + 0.010*\"file\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"softwar\" + 0.006*\"univers\" + 0.006*\"us\" + 0.005*\"mail\" + 0.005*\"host\"\n", + "2019-01-31 03:18:43,799 : INFO : topic #4 (0.200): 0.020*\"armenian\" + 0.012*\"turkish\" + 0.010*\"peopl\" + 0.007*\"said\" + 0.006*\"turkei\" + 0.006*\"armenia\" + 0.006*\"turk\" + 0.005*\"know\" + 0.004*\"greek\" + 0.004*\"year\"\n", + "2019-01-31 03:18:43,801 : INFO : topic diff=0.203499, rho=0.357622\n", + "2019-01-31 03:18:49,095 : INFO 
: CorpusAccumulator accumulated stats from 1000 documents\n", + "2019-01-31 03:19:05,551 : INFO : Loss: 1.0280021673693736\n", + "2019-01-31 03:19:05,749 : INFO : Loss: 0.9805869534381415\n", + "2019-01-31 03:19:11,783 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n" ] } ], @@ -959,21 +943,19 @@ "))\n", "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)\n", "\n", - "for variable_params in variable_params_grid:\n", - " row = dict()\n", - " row['model'] = 'gensim_nmf'\n", - " row.update(variable_params)\n", - " row['train_time'], model = get_execution_time(\n", - " lambda: GensimNmf(\n", - " normalize=False,\n", - " **fixed_params,\n", - " **variable_params,\n", - " )\n", + "row = dict()\n", + "row['model'] = 'gensim_nmf'\n", + "row['train_time'], model = get_execution_time(\n", + " lambda: GensimNmf(\n", + " normalize=False,\n", + " **fixed_params\n", " )\n", - " row.update(get_tm_metrics(\n", - " model, train_corpus, test_corpus, test_dense_corpus, trainset_target, testset_target,\n", - " ))\n", - " tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)" + ")\n", + "row.update(get_tm_metrics(\n", + " model, train_corpus, test_corpus, test_dense_corpus, trainset_target, testset_target,\n", + "))\n", + "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)\n", + "tm_metrics.replace(np.nan, '-', inplace=True)" ] }, { @@ -985,7 +967,7 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": 19, "metadata": {}, "outputs": [ { @@ -1014,251 +996,49 @@ " l2_norm\n", " model\n", " perplexity\n", - " topics\n", " train_time\n", - " lambda_\n", - " sparse_coef\n", - " use_r\n", " \n", " \n", " \n", " \n", - " 5\n", - " -1.675162\n", - " 0.527719\n", - " 7.167809\n", - " gensim_nmf\n", - " 24.738142\n", - " [(0, 0.035*\"com\" + 0.030*\"world\" + 0.030*\"like...\n", - " 3.597497\n", - " 1.0\n", - " 3.0\n", - " 1.0\n", - " \n", - " \n", - " 3\n", - " -1.693074\n", - " 0.625267\n", - " 7.035608\n", - " 
gensim_nmf\n", - " 2479.600679\n", - " [(0, 0.012*\"com\" + 0.012*\"armenian\" + 0.011*\"w...\n", - " 19.820650\n", - " 1.0\n", - " 0.0\n", - " 1.0\n", - " \n", - " \n", - " 13\n", - " -1.695379\n", - " 0.675373\n", - " 7.183766\n", - " gensim_nmf\n", - " 48.768942\n", - " [(0, 0.025*\"armenian\" + 0.023*\"peopl\" + 0.021*...\n", - " 5.856175\n", - " 100.0\n", - " 3.0\n", - " 1.0\n", - " \n", - " \n", - " 9\n", - " -1.670903\n", - " 0.694030\n", - " 7.131330\n", - " gensim_nmf\n", - " 46.644018\n", - " [(0, 0.031*\"armenian\" + 0.021*\"peopl\" + 0.020*...\n", - " 4.476314\n", - " 10.0\n", - " 3.0\n", - " 1.0\n", - " \n", - " \n", " 1\n", - " NaN\n", - " 0.698827\n", + " -\n", + " 0.696695\n", " 6.929583\n", " sklearn_nmf\n", " 2404.189918\n", - " NaN\n", - " 5.676373\n", - " NaN\n", - " NaN\n", - " NaN\n", - " \n", - " \n", - " 11\n", - " -1.711411\n", - " 0.698827\n", - " 7.059604\n", - " gensim_nmf\n", - " 2460.213716\n", - " [(0, 0.017*\"armenian\" + 0.016*\"peopl\" + 0.015*...\n", - " 27.860318\n", - " 100.0\n", - " 0.0\n", - " 1.0\n", - " \n", - " \n", - " 4\n", - " -1.712103\n", - " 0.700959\n", - " 7.174119\n", - " gensim_nmf\n", - " 55.361718\n", - " [(0, 0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*...\n", - " 1.205277\n", - " 1.0\n", - " 3.0\n", - " 0.0\n", - " \n", - " \n", - " 8\n", - " -1.712103\n", - " 0.700959\n", - " 7.174119\n", - " gensim_nmf\n", - " 55.361718\n", - " [(0, 0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*...\n", - " 1.091239\n", - " 10.0\n", - " 3.0\n", - " 0.0\n", - " \n", - " \n", - " 12\n", - " -1.712103\n", - " 0.700959\n", - " 7.174119\n", - " gensim_nmf\n", - " 55.361718\n", - " [(0, 0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*...\n", - " 1.219200\n", - " 100.0\n", - " 3.0\n", - " 0.0\n", + " 12.541235\n", " \n", " \n", " 2\n", - " -1.702542\n", - " 0.711087\n", - " 7.060992\n", - " gensim_nmf\n", - " 2473.714343\n", - " [(0, 0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*...\n", - " 2.253492\n", - " 1.0\n", - " 0.0\n", - " 
0.0\n", - " \n", - " \n", - " 6\n", - " -1.702542\n", - " 0.711087\n", - " 7.060992\n", - " gensim_nmf\n", - " 2473.714343\n", - " [(0, 0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*...\n", - " 2.271240\n", - " 10.0\n", - " 0.0\n", - " 0.0\n", - " \n", - " \n", - " 10\n", - " -1.702542\n", - " 0.711087\n", - " 7.060992\n", + " -1.70539\n", + " 0.715352\n", + " 7.061342\n", " gensim_nmf\n", - " 2473.714343\n", - " [(0, 0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*...\n", - " 2.247909\n", - " 100.0\n", - " 0.0\n", - " 0.0\n", - " \n", - " \n", - " 7\n", - " -1.663787\n", - " 0.750000\n", - " 7.040535\n", - " gensim_nmf\n", - " 2287.018000\n", - " [(0, 0.022*\"armenian\" + 0.015*\"peopl\" + 0.014*...\n", - " 20.997104\n", - " 10.0\n", - " 0.0\n", - " 1.0\n", + " 2475.979773\n", + " 0.656207\n", " \n", " \n", " 0\n", - " -1.755650\n", + " -1.75565\n", " 0.765458\n", " 7.002725\n", " lda\n", - " 1939.575701\n", - " [(0, 0.014*\"space\" + 0.008*\"com\" + 0.007*\"bike...\n", - " 14.540969\n", - " NaN\n", - " NaN\n", - " NaN\n", + " 1939.575705\n", + " 16.793869\n", " \n", " \n", "\n", "" ], "text/plain": [ - " coherence f1 l2_norm model perplexity \\\n", - "5 -1.675162 0.527719 7.167809 gensim_nmf 24.738142 \n", - "3 -1.693074 0.625267 7.035608 gensim_nmf 2479.600679 \n", - "13 -1.695379 0.675373 7.183766 gensim_nmf 48.768942 \n", - "9 -1.670903 0.694030 7.131330 gensim_nmf 46.644018 \n", - "1 NaN 0.698827 6.929583 sklearn_nmf 2404.189918 \n", - "11 -1.711411 0.698827 7.059604 gensim_nmf 2460.213716 \n", - "4 -1.712103 0.700959 7.174119 gensim_nmf 55.361718 \n", - "8 -1.712103 0.700959 7.174119 gensim_nmf 55.361718 \n", - "12 -1.712103 0.700959 7.174119 gensim_nmf 55.361718 \n", - "2 -1.702542 0.711087 7.060992 gensim_nmf 2473.714343 \n", - "6 -1.702542 0.711087 7.060992 gensim_nmf 2473.714343 \n", - "10 -1.702542 0.711087 7.060992 gensim_nmf 2473.714343 \n", - "7 -1.663787 0.750000 7.040535 gensim_nmf 2287.018000 \n", - "0 -1.755650 0.765458 7.002725 lda 1939.575701 \n", 
- "\n", - " topics train_time lambda_ \\\n", - "5 [(0, 0.035*\"com\" + 0.030*\"world\" + 0.030*\"like... 3.597497 1.0 \n", - "3 [(0, 0.012*\"com\" + 0.012*\"armenian\" + 0.011*\"w... 19.820650 1.0 \n", - "13 [(0, 0.025*\"armenian\" + 0.023*\"peopl\" + 0.021*... 5.856175 100.0 \n", - "9 [(0, 0.031*\"armenian\" + 0.021*\"peopl\" + 0.020*... 4.476314 10.0 \n", - "1 NaN 5.676373 NaN \n", - "11 [(0, 0.017*\"armenian\" + 0.016*\"peopl\" + 0.015*... 27.860318 100.0 \n", - "4 [(0, 0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*... 1.205277 1.0 \n", - "8 [(0, 0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*... 1.091239 10.0 \n", - "12 [(0, 0.021*\"armenian\" + 0.020*\"peopl\" + 0.019*... 1.219200 100.0 \n", - "2 [(0, 0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*... 2.253492 1.0 \n", - "6 [(0, 0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*... 2.271240 10.0 \n", - "10 [(0, 0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*... 2.247909 100.0 \n", - "7 [(0, 0.022*\"armenian\" + 0.015*\"peopl\" + 0.014*... 20.997104 10.0 \n", - "0 [(0, 0.014*\"space\" + 0.008*\"com\" + 0.007*\"bike... 
14.540969 NaN \n", - "\n", - " sparse_coef use_r \n", - "5 3.0 1.0 \n", - "3 0.0 1.0 \n", - "13 3.0 1.0 \n", - "9 3.0 1.0 \n", - "1 NaN NaN \n", - "11 0.0 1.0 \n", - "4 3.0 0.0 \n", - "8 3.0 0.0 \n", - "12 3.0 0.0 \n", - "2 0.0 0.0 \n", - "6 0.0 0.0 \n", - "10 0.0 0.0 \n", - "7 0.0 1.0 \n", - "0 NaN NaN " + " coherence f1 l2_norm model perplexity train_time\n", + "1 - 0.696695 6.929583 sklearn_nmf 2404.189918 12.541235\n", + "2 -1.70539 0.715352 7.061342 gensim_nmf 2475.979773 0.656207\n", + "0 -1.75565 0.765458 7.002725 lda 1939.575705 16.793869" ] }, - "execution_count": 23, + "execution_count": 19, "metadata": {}, "output_type": "execute_result" } @@ -1267,96 +1047,28 @@ "tm_metrics.sort_values('f1')" ] }, - { - "cell_type": "code", - "execution_count": 24, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Best NMF's topics\n" - ] - }, - { - "data": { - "text/plain": [ - "[(0,\n", - " '0.017*\"armenian\" + 0.015*\"peopl\" + 0.014*\"said\" + 0.013*\"know\" + 0.008*\"went\" + 0.008*\"sai\" + 0.007*\"like\" + 0.007*\"apart\" + 0.007*\"come\" + 0.007*\"azerbaijani\"'),\n", - " (1,\n", - " '0.074*\"jpeg\" + 0.032*\"file\" + 0.031*\"gif\" + 0.028*\"imag\" + 0.024*\"color\" + 0.017*\"format\" + 0.014*\"qualiti\" + 0.013*\"convert\" + 0.013*\"compress\" + 0.013*\"version\"'),\n", - " (2,\n", - " '0.030*\"imag\" + 0.014*\"graphic\" + 0.012*\"data\" + 0.010*\"file\" + 0.010*\"pub\" + 0.010*\"ftp\" + 0.010*\"avail\" + 0.008*\"format\" + 0.008*\"program\" + 0.008*\"packag\"'),\n", - " (3,\n", - " '0.015*\"god\" + 0.012*\"atheist\" + 0.009*\"believ\" + 0.009*\"exist\" + 0.008*\"atheism\" + 0.007*\"peopl\" + 0.007*\"religion\" + 0.006*\"christian\" + 0.006*\"israel\" + 0.006*\"religi\"'),\n", - " (4,\n", - " '0.028*\"space\" + 0.019*\"launch\" + 0.013*\"satellit\" + 0.009*\"orbit\" + 0.008*\"nasa\" + 0.007*\"year\" + 0.006*\"mission\" + 0.006*\"new\" + 0.006*\"commerci\" + 0.005*\"market\"')]" - ] - }, - "execution_count": 24, 
- "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "print(\"Best NMF's topics\")\n", - "tm_metrics.iloc[2].topics" - ] - }, - { - "cell_type": "code", - "execution_count": 25, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "LDA topics\n" - ] - }, - { - "data": { - "text/plain": [ - "[(0,\n", - " '0.014*\"space\" + 0.008*\"com\" + 0.007*\"bike\" + 0.007*\"nasa\" + 0.005*\"new\" + 0.005*\"orbit\" + 0.005*\"launch\" + 0.005*\"year\" + 0.005*\"univers\" + 0.004*\"like\"'),\n", - " (1,\n", - " '0.011*\"god\" + 0.011*\"com\" + 0.008*\"peopl\" + 0.008*\"think\" + 0.007*\"like\" + 0.006*\"thing\" + 0.006*\"know\" + 0.005*\"moral\" + 0.005*\"believ\" + 0.005*\"time\"'),\n", - " (2,\n", - " '0.013*\"israel\" + 0.011*\"isra\" + 0.010*\"jew\" + 0.007*\"arab\" + 0.007*\"peopl\" + 0.006*\"state\" + 0.006*\"islam\" + 0.006*\"right\" + 0.005*\"think\" + 0.004*\"jewish\"'),\n", - " (3,\n", - " '0.012*\"imag\" + 0.010*\"graphic\" + 0.010*\"file\" + 0.008*\"com\" + 0.008*\"program\" + 0.006*\"softwar\" + 0.006*\"univers\" + 0.006*\"us\" + 0.005*\"mail\" + 0.005*\"host\"'),\n", - " (4,\n", - " '0.020*\"armenian\" + 0.012*\"turkish\" + 0.010*\"peopl\" + 0.007*\"said\" + 0.006*\"turkei\" + 0.006*\"armenia\" + 0.006*\"turk\" + 0.005*\"know\" + 0.004*\"greek\" + 0.004*\"year\"')]" - ] - }, - "execution_count": 25, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "print('LDA topics')\n", - "tm_metrics.iloc[0].topics" - ] - }, { "cell_type": "markdown", "metadata": {}, "source": [ - "- Gensim NMF clearly beats sklearn implementation both in terms of speed and quality\n", - "- LDA is still significantly better in terms of quality, though interpretabiliy of topics and speed are clearly worse then NMF's" + "### Main insights\n", + "\n", + "- Gensim NMF is **ridiculously** fast and leaves LDA and Sklearn far behind in terms of training time\n", + "- Gensim NMF beats sklearn NMF 
implementation on f1 metric, though not on the l2 norm and perplexity\n", + "- Gensim NMF beats LDA on coherence, but LDA is still better on perplexity and l2 norm" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "## Olivietti faces + Gensim NMF\n", + "## Faces Dataset Decomposition + Gensim NMF\n", + "\n", "NMF algorithm works not only with texts, but with all kinds of stuff!\n", "\n", - "Let's run our model with other factorization algorithms and check out the results" + "Let's compare our model with the other factorization algorithms and check out the results!\n", + "\n", + "To do that we'll patch sklearn's [Faces Dataset Decomposition](https://scikit-learn.org/stable/auto_examples/decomposition/plot_faces_decomposition.html)." ] }, { @@ -1364,59 +1076,47 @@ "metadata": {}, "source": [ "### Sklearn wrapper\n", - "We need that wrapper to compare Gensim NMF with other factorizations on images" + "Let's create a wrapper to compare Gensim NMF with the other factorizations on images" ] }, { "cell_type": "code", - "execution_count": 26, + "execution_count": 20, "metadata": { "lines_to_next_cell": 2 }, "outputs": [], "source": [ "from sklearn.base import BaseEstimator, TransformerMixin\n", + "import scipy.sparse as sparse\n", "\n", "\n", "class NmfWrapper(BaseEstimator, TransformerMixin):\n", - " def __init__(self, **kwargs):\n", + " def __init__(self, bow_matrix, **kwargs):\n", + " self.corpus = sparse.csc.csc_matrix(bow_matrix)\n", " self.nmf = GensimNmf(**kwargs)\n", - " self.corpus = None\n", - "\n", - " def fit_transform(self, X):\n", - " self.fit(X)\n", - " return self.transform(X)\n", "\n", " def fit(self, X):\n", - " self.corpus = [\n", - " [\n", - " (feature_idx, value)\n", - " for feature_idx, value\n", - " in enumerate(sample)\n", - " ]\n", - " for sample\n", - " in X\n", - " ]\n", - "\n", " self.nmf.update(self.corpus)\n", "\n", - " def transform(self, X):\n", - " H = np.zeros((len(self.corpus), self.nmf.num_topics))\n", - " for bow_id, bow in 
enumerate(self.corpus):\n", - " for topic_id, proba in self.nmf[bow]:\n", - " H[bow_id, topic_id] = proba\n", - "\n", - " return H\n", - "\n", " @property\n", " def components_(self):\n", " return self.nmf.get_topics()" ] }, { - "cell_type": "code", - "execution_count": 27, + "cell_type": "markdown", "metadata": {}, + "source": [ + "### Modified FDD notebook" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": { + "scrolled": false + }, "outputs": [ { "name": "stdout", @@ -1435,9 +1135,9 @@ "\n", "Dataset consists of 400 faces\n", "Extracting the top 6 Eigenfaces - PCA using randomized SVD...\n", - "done in 0.195s\n", + "done in 0.172s\n", "Extracting the top 6 Non-negative components - NMF (Sklearn)...\n", - "done in 1.069s\n", + "done in 0.905s\n", "Extracting the top 6 Non-negative components - NMF (Gensim)...\n" ] }, @@ -1445,35 +1145,40 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-17 14:54:20,785 : INFO : Loss (no outliers): 5.486415140971889\tLoss (with outliers): 5.486415140971889\n", - "2019-01-17 14:54:20,788 : INFO : Loss (no outliers): 5.486415140971889\tLoss (with outliers): 5.486415140971889\n" + "2019-01-31 03:19:14,462 : INFO : Loss: 1.0006496938661258\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "done in 6.041s\n", + "done in 0.818s\n", "Extracting the top 6 Independent components - FastICA...\n", - "done in 0.197s\n", + "done in 0.448s\n", "Extracting the top 6 Sparse comp. 
- MiniBatchSparsePCA...\n", - "done in 0.862s\n", + "done in 1.343s\n", "Extracting the top 6 MiniBatchDictionaryLearning...\n", - "done in 0.660s\n", + "done in 2.885s\n", "Extracting the top 6 Cluster centers - MiniBatchKMeans...\n", - "done in 0.064s\n", - "Extracting the top 6 Factor Analysis components - FA...\n", - "done in 0.113s\n" + "done in 0.133s\n", + "Extracting the top 6 Factor Analysis components - FA...\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ - "/home/anotherbugmaster/.virtualenvs/gensim/lib/python3.7/site-packages/sklearn/decomposition/factor_analysis.py:228: ConvergenceWarning: FactorAnalysis did not converge. You might want to increase the number of iterations.\n", + "/home/anotherbugmaster/.virtualenvs/gensim/lib/python3.6/site-packages/sklearn/decomposition/factor_analysis.py:228: ConvergenceWarning: FactorAnalysis did not converge. You might want to increase the number of iterations.\n", " ConvergenceWarning)\n" ] }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "done in 0.304s\n" + ] + }, { "data": { "image/png": "\n", @@ -1486,7 +1191,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1496,7 +1201,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1506,7 +1211,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1516,7 +1221,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1526,7 +1231,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1536,7 +1241,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1566,7 +1271,7 @@ }, { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -1642,13 +1347,14 @@ "\n", " ('Non-negative components - NMF (Gensim)',\n", " NmfWrapper(\n", - " chunksize=1,\n", + " bow_matrix=faces.T,\n", + " chunksize=2,\n", " eval_every=400,\n", " passes=1,\n", - " sparse_coef=0,\n", " id2word={idx: idx for idx in range(faces.shape[1])},\n", " num_topics=n_components,\n", - " minimum_probability=0\n", + " minimum_probability=0,\n", + " random_state=42,\n", " ),\n", " False),\n", "\n", @@ -1715,6 +1421,22 @@ "\n", "plt.show()" ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "As you can see, the Gensim NMF implementation works as fast as Sklearn NMF and achieves comparable quality, even though it's not optimised for dense matrices." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Conclusion\n", + "\n", + "Gensim NMF is an extremely fast and memory-optimized model, and should be used whenever your system resources are too scarce for the task or when you want to try something different from LDA." 
+ ] } ], "metadata": { @@ -1722,8 +1444,8 @@ "text_representation": { "extension": ".py", "format_name": "percent", - "format_version": "1.2", - "jupytext_version": "0.8.6" + "format_version": "1.1", + "jupytext_version": "0.8.3" } }, "kernelspec": { @@ -1741,7 +1463,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.7.2" + "version": "3.6.8" } }, "nbformat": 4, diff --git a/docs/notebooks/nmf_wikipedia.ipynb b/docs/notebooks/nmf_wikipedia.ipynb index eaa3c656c7..49dbd318b6 100644 --- a/docs/notebooks/nmf_wikipedia.ipynb +++ b/docs/notebooks/nmf_wikipedia.ipynb @@ -29,13 +29,19 @@ "import scipy.sparse\n", "import smart_open\n", "import time\n", + "import os\n", + "import psutil\n", + "from contextlib import contextmanager\n", + "from multiprocessing import Process\n", "from tqdm import tqdm, tqdm_notebook\n", + "import joblib\n", "\n", "import gensim.downloader as api\n", "from gensim import matutils\n", "from gensim.corpora import MmCorpus, Dictionary\n", "from gensim.models import LdaModel, CoherenceModel\n", - "from gensim.models.nmf import Nmf\n", + "from gensim.models.nmf import Nmf as GensimNmf\n", + "from sklearn.decomposition.nmf import NMF as SklearnNmf\n", "from gensim.parsing.preprocessing import preprocess_string\n", "\n", "tqdm.pandas()\n", @@ -244,11 +250,11 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-15 19:31:03,151 : INFO : loading Dictionary object from wiki.dict\n", - "2019-01-15 19:31:04,024 : INFO : loaded wiki.dict\n", - "2019-01-15 19:31:06,292 : INFO : discarding 1910258 tokens: [('abdelrahim', 49), ('abstention', 120), ('anarcha', 101), ('anarchica', 40), ('anarchosyndicalist', 20), ('antimilitar', 68), ('arbet', 194), ('archo', 100), ('arkhē', 5), ('autonomedia', 118)]...\n", - "2019-01-15 19:31:06,293 : INFO : keeping 100000 tokens which were in no less than 5 and no more than 2462447 (=50.0%) documents\n", - "2019-01-15 19:31:06,645 : INFO : resulting dictionary: 
Dictionary(100000 unique tokens: ['abandon', 'abil', 'abl', 'abolit', 'abstent']...)\n" + "2019-01-30 23:49:27,738 : INFO : loading Dictionary object from wiki.dict\n", + "2019-01-30 23:49:28,637 : INFO : loaded wiki.dict\n", + "2019-01-30 23:49:33,783 : INFO : discarding 1910146 tokens: [('abdelrahim', 49), ('abstention', 120), ('anarcha', 101), ('anarchica', 40), ('anarchosyndicalist', 20), ('antimilitar', 68), ('arbet', 194), ('archo', 100), ('arkhē', 5), ('autonomedia', 118)]...\n", + "2019-01-30 23:49:33,784 : INFO : keeping 100000 tokens which were in no less than 5 and no more than 2462447 (=50.0%) documents\n", + "2019-01-30 23:49:34,701 : INFO : resulting dictionary: Dictionary(100000 unique tokens: ['omana', 'thoroughfar', 'janssen', 'boletacea', 'itzik']...)\n" ] } ], @@ -283,18 +289,22 @@ " super().__init__(*args, **kwargs)\n", "\n", " random_state = np.random.RandomState(random_seed)\n", + " \n", " self.indices = random_state.permutation(range(self.num_docs))\n", + " test_nnz = sum(len(self[doc_idx]) for doc_idx in self.indices[:testsize])\n", + " \n", " if testset:\n", " self.indices = self.indices[:testsize]\n", + " self.num_docs = testsize\n", + " self.num_nnz = test_nnz\n", " else:\n", " self.indices = self.indices[testsize:]\n", + " self.num_docs -= testsize\n", + " self.num_nnz -= test_nnz\n", "\n", " def __iter__(self):\n", " for doc_id in self.indices:\n", - " yield self[doc_id]\n", - " \n", - " def __len__(self):\n", - " return len(self.indices)" + " yield self[doc_id]" ] }, { @@ -343,12 +353,12 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-15 19:31:07,323 : INFO : loaded corpus index from wiki.mm.index\n", - "2019-01-15 19:31:07,324 : INFO : initializing cython corpus reader from wiki.mm\n", - "2019-01-15 19:31:07,325 : INFO : accepted corpus with 4924894 documents, 100000 features, 683375728 non-zero entries\n", - "2019-01-15 19:31:08,544 : INFO : loaded corpus index from wiki.mm.index\n", - "2019-01-15 19:31:08,544 : 
INFO : initializing cython corpus reader from wiki.mm\n", - "2019-01-15 19:31:08,545 : INFO : accepted corpus with 4924894 documents, 100000 features, 683375728 non-zero entries\n" + "2019-01-30 23:49:35,606 : INFO : loaded corpus index from wiki.mm.index\n", + "2019-01-30 23:49:35,607 : INFO : initializing cython corpus reader from wiki.mm\n", + "2019-01-30 23:49:35,607 : INFO : accepted corpus with 4924894 documents, 100000 features, 683326444 non-zero entries\n", + "2019-01-30 23:49:37,629 : INFO : loaded corpus index from wiki.mm.index\n", + "2019-01-30 23:49:37,630 : INFO : initializing cython corpus reader from wiki.mm\n", + "2019-01-30 23:49:37,630 : INFO : accepted corpus with 4924894 documents, 100000 features, 683326444 non-zero entries\n" ] } ], @@ -365,7 +375,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Metrics" + "### Convert corpora to csc and save" ] }, { @@ -374,12 +384,82 @@ "metadata": {}, "outputs": [], "source": [ - "def get_execution_time(func):\n", + "SAVE_CSC = False\n", + "\n", + "if SAVE_CSC:\n", + " train_csc = matutils.corpus2csc(train_corpus, len(dictionary))\n", + " scipy.sparse.save_npz('train_csc.npz', train_csc)\n", + " \n", + " test_csc = matutils.corpus2csc(test_corpus, len(dictionary))\n", + " scipy.sparse.save_npz('test_csc.npz', test_csc)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Load csc" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "train_csc = scipy.sparse.load_npz('train_csc.npz')\n", + "test_csc = scipy.sparse.load_npz('test_csc.npz')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Metrics" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "@contextmanager\n", + "def measure_ram(output, tick=2):\n", + " def _measure_ram(pid, output, tick=5):\n", + " py = psutil.Process(pid)\n", + " with open(output, 'w') as 
outfile:\n", + " while True:\n", + " memory = py.memory_info().rss\n", + " outfile.write(\"{}\\n\".format(memory))\n", + " outfile.flush()\n", + " time.sleep(tick)\n", + "\n", + " pid = os.getpid()\n", + " p = Process(target=_measure_ram, args=(pid, output, tick))\n", + " p.start()\n", + " yield\n", + " p.terminate()\n", + "\n", + "def get_train_time_and_ram(func, name):\n", + " memprof_filename = \"{}.memprof\".format(name)\n", + " \n", " start = time.time()\n", "\n", - " result = func()\n", + " with measure_ram(memprof_filename, 5):\n", + " result = func() \n", + " \n", + " elapsed_time = pd.to_timedelta(time.time() - start, unit='s').round('s')\n", + " \n", + " memprof_df = pd.read_csv(memprof_filename, squeeze=True)\n", + " \n", + " mean_ram = \"{} MB\".format(\n", + " memprof_df.mean() // 2**20,\n", + " )\n", + " \n", + " max_ram = \"{} MB\".format(memprof_df.max() // 2**20)\n", "\n", - " return (time.time() - start), result\n", + " return elapsed_time, mean_ram, max_ram, result\n", "\n", "\n", "def get_tm_metrics(model, test_corpus):\n", @@ -406,15 +486,12 @@ " coherence='u_mass'\n", " ).get_coherence()\n", "\n", - " topics = model.show_topics()\n", - "\n", " model.normalize = False\n", "\n", " return dict(\n", - " perplexity=perplexity,\n", - " coherence=coherence,\n", - " topics=topics,\n", - " l2_norm=l2_norm,\n", + " perplexity=round(perplexity, 4),\n", + " coherence=round(coherence, 4),\n", + " l2_norm=round(l2_norm, 4),\n", " )\n", "\n", "\n", @@ -423,7 +500,26 @@ "\n", "\n", "def get_tm_l2_norm(pred_factors, dense_corpus):\n", - " return np.linalg.norm(dense_corpus / dense_corpus.sum(axis=0) - pred_factors)" + " return np.linalg.norm(dense_corpus / dense_corpus.sum(axis=0) - pred_factors)\n", + "\n", + "\n", + "def get_sklearn_metrics(model, test_corpus):\n", + " W = model.components_.T\n", + " H = model.transform((test_corpus / test_corpus.sum(axis=0)).T).T\n", + " pred_factors = W.dot(H)\n", + " pred_factors /= pred_factors.sum(axis=0)\n", + "\n", + 
" perplexity = np.exp(\n", + " -(np.log(pred_factors, where=pred_factors > 0) * test_corpus).sum()\n", + " / test_corpus.sum()\n", + " )\n", + "\n", + " l2_norm = np.linalg.norm(test_corpus / test_corpus.sum(axis=0) - pred_factors)\n", + "\n", + " return dict(\n", + " perplexity=perplexity,\n", + " l2_norm=l2_norm,\n", + " )" ] }, { @@ -435,7 +531,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 13, "metadata": {}, "outputs": [], "source": [ @@ -446,12 +542,12 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### Define common params for models" + "### Define common params for the models" ] }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 14, "metadata": {}, "outputs": [], "source": [ @@ -478,230 +574,296 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "### Train NMF and save it\n", + "### Train Gensim NMF and save it\n", "Normalization is turned off to compute metrics correctly" ] }, { "cell_type": "code", - "execution_count": 13, - "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "2019-01-15 19:33:21,875 : INFO : Loss (no outliers): 2186.768444126956\tLoss (with outliers): 2186.768444126956\n", - "2019-01-15 19:34:49,514 : INFO : Loss (no outliers): 2298.434152045061\tLoss (with outliers): 2298.434152045061\n", - "==Truncated==\n", - "2019-01-15 20:44:23,913 : INFO : Loss (no outliers): 1322.9664709183141\tLoss (with outliers): 1322.9664709183141\n", - "2019-01-15 20:44:23,928 : INFO : saving Nmf object under nmf.model, separately None\n", - "2019-01-15 20:44:24,625 : INFO : saved nmf.model\n" - ] - } - ], - "source": [ - "row = dict()\n", - "row['model'] = 'nmf'\n", - "row['train_time'], nmf = get_execution_time(\n", - " lambda: Nmf(\n", - " use_r=False,\n", - " normalize=False,\n", - " **params\n", - " )\n", - ")\n", - "nmf.save('nmf.model')" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Load NMF and store 
metrics" - ] - }, - { - "cell_type": "code", - "execution_count": 14, + "execution_count": 15, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "2019-01-15 20:44:24,872 : INFO : loading Nmf object from nmf.model\n", - "2019-01-15 20:44:25,150 : INFO : loading id2word recursively from nmf.model.id2word.* with mmap=None\n", - "2019-01-15 20:44:25,151 : INFO : loaded nmf.model\n", - "2019-01-15 20:44:54,148 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-15 20:44:54,336 : INFO : CorpusAccumulator accumulated stats from 2000 documents\n" + "2019-01-30 23:50:41,538 : INFO : Loss: 0.9592283350028137\n", + "2019-01-30 23:51:07,841 : INFO : Loss: 0.9654052723463945\n", + "2019-01-30 23:51:19,986 : INFO : Loss: 0.983610134773025\n", + "2019-01-30 23:51:31,494 : INFO : Loss: 0.9856176961379628\n", + "2019-01-30 23:51:47,703 : INFO : Loss: 1.0388382070148916\n", + "2019-01-30 23:52:00,235 : INFO : Loss: 0.9885831160386329\n", + "2019-01-30 23:52:10,915 : INFO : Loss: 0.9940857027761342\n", + "2019-01-30 23:52:19,815 : INFO : Loss: 0.9946127359838275\n", + "2019-01-30 23:52:28,330 : INFO : Loss: 0.9949275215480511\n", + "2019-01-30 23:52:36,515 : INFO : Loss: 0.9957360140573942\n", + "2019-01-30 23:52:45,287 : INFO : Loss: 0.995799267839182\n", + "2019-01-30 23:52:53,664 : INFO : Loss: 0.9950670862672046\n", + "2019-01-30 23:53:00,937 : INFO : Loss: 0.9959924745279174\n", + "2019-01-30 23:53:09,471 : INFO : Loss: 0.9959557971255888\n", + "2019-01-30 23:53:17,299 : INFO : Loss: 0.9992069754012614\n", + "2019-01-30 23:53:24,887 : INFO : Loss: 0.9970817907880735\n", + "2019-01-30 23:53:31,921 : INFO : Loss: 0.9968030668126687\n", + "2019-01-30 23:53:40,154 : INFO : Loss: 1.000805162837266\n", + "2019-01-30 23:53:47,588 : INFO : Loss: 1.0036445937560066\n", + "2019-01-30 23:53:56,589 : INFO : Loss: 0.9978459394716457\n", + "2019-01-30 23:54:03,979 : INFO : Loss: 0.9989593665461145\n", + "2019-01-30 23:54:10,702 : 
INFO : Loss: 0.9980982301738708\n", + "2019-01-30 23:54:17,266 : INFO : Loss: 0.998238226164612\n", + "2019-01-30 23:54:23,887 : INFO : Loss: 0.9985550255498024\n", + "2019-01-30 23:54:30,537 : INFO : Loss: 0.9996225023252939\n", + "2019-01-30 23:54:37,091 : INFO : Loss: 0.9987754828651019\n", + "2019-01-30 23:54:43,688 : INFO : Loss: 0.9990247943574684\n", + "2019-01-30 23:54:50,660 : INFO : Loss: 1.029933776961323\n", + "2019-01-30 23:54:57,057 : INFO : Loss: 0.9984374937212643\n", + "2019-01-30 23:55:03,790 : INFO : Loss: 0.9986012940684562\n", + "2019-01-30 23:55:10,033 : INFO : Loss: 0.9984611293557583\n", + "2019-01-30 23:55:16,684 : INFO : Loss: 1.003185791874025\n", + "2019-01-30 23:55:22,973 : INFO : Loss: 1.0001865879991019\n", + "2019-01-30 23:55:29,217 : INFO : Loss: 0.9994679229677745\n", + "2019-01-30 23:55:35,906 : INFO : Loss: 0.9985081154694843\n", + "2019-01-30 23:55:42,292 : INFO : Loss: 0.9990448183844505\n", + "2019-01-30 23:55:49,929 : INFO : Loss: 1.000794691283293\n", + "2019-01-30 23:55:56,328 : INFO : Loss: 1.0002123974155162\n", + "2019-01-30 23:56:02,429 : INFO : Loss: 0.9989732756831223\n", + "2019-01-30 23:56:08,386 : INFO : Loss: 0.9995798986671256\n", + "2019-01-30 23:56:14,287 : INFO : Loss: 0.9988648461033055\n", + "2019-01-30 23:56:20,215 : INFO : Loss: 0.9994823271485055\n", + "2019-01-30 23:56:27,174 : INFO : Loss: 0.9992080164439477\n", + "2019-01-30 23:56:33,158 : INFO : Loss: 0.9988811343061132\n", + "2019-01-30 23:56:39,103 : INFO : Loss: 1.0013969957742161\n", + "2019-01-30 23:56:44,826 : INFO : Loss: 0.9994270907250508\n", + "2019-01-30 23:56:50,690 : INFO : Loss: 1.0034991318444846\n", + "2019-01-30 23:56:56,529 : INFO : Loss: 0.9991126657253063\n", + "2019-01-30 23:57:02,515 : INFO : Loss: 0.9997881610469845\n", + "2019-01-30 23:57:08,185 : INFO : Loss: 1.0\n", + "2019-01-30 23:57:13,680 : INFO : Loss: 1.0\n", + "2019-01-30 23:57:19,254 : INFO : Loss: 1.0007322403108705\n", + "2019-01-30 23:57:24,728 : INFO : Loss: 
0.9998991583235138\n", + "2019-01-30 23:57:30,255 : INFO : Loss: 1.0\n", + "2019-01-30 23:57:35,879 : INFO : Loss: 1.000862549425418\n", + "2019-01-30 23:57:41,421 : INFO : Loss: 0.9993713664199815\n", + "2019-01-30 23:57:47,091 : INFO : Loss: 1.0\n", + "2019-01-30 23:57:52,975 : INFO : Loss: 1.0012177641426152\n", + "2019-01-30 23:57:58,429 : INFO : Loss: 0.9994286988767374\n", + "2019-01-30 23:58:03,930 : INFO : Loss: 0.9994671593690372\n", + "2019-01-30 23:58:09,306 : INFO : Loss: 1.001183875880235\n", + "2019-01-30 23:58:15,514 : INFO : Loss: 0.9994795707619146\n", + "2019-01-30 23:58:21,136 : INFO : Loss: 0.9992854839602129\n", + "2019-01-30 23:58:26,589 : INFO : Loss: 0.9994518698021087\n", + "2019-01-30 23:58:32,003 : INFO : Loss: 0.9990751419440501\n", + "2019-01-30 23:58:37,371 : INFO : Loss: 0.9994931463773729\n", + "2019-01-30 23:58:42,638 : INFO : Loss: 0.9994701481009289\n", + "2019-01-30 23:58:48,291 : INFO : Loss: 0.9994988926020567\n", + "2019-01-30 23:58:54,907 : INFO : Loss: 0.9992860285805035\n", + "2019-01-30 23:59:00,262 : INFO : Loss: 0.9998802191658904\n", + "2019-01-30 23:59:06,694 : INFO : Loss: 1.0003219826923089\n", + "2019-01-30 23:59:12,160 : INFO : Loss: 1.0020653252480436\n", + "2019-01-30 23:59:17,886 : INFO : Loss: 1.0\n", + "2019-01-30 23:59:22,959 : INFO : Loss: 0.99960539436228\n", + "2019-01-30 23:59:28,326 : INFO : Loss: 0.9997496698976536\n", + "2019-01-30 23:59:33,570 : INFO : Loss: 1.0\n", + "2019-01-30 23:59:38,901 : INFO : Loss: 0.9992640842941912\n", + "2019-01-30 23:59:44,234 : INFO : Loss: 0.9996701790008146\n", + "2019-01-30 23:59:49,554 : INFO : Loss: 0.9995232569631003\n", + "2019-01-30 23:59:54,880 : INFO : Loss: 0.9994679955178987\n", + "2019-01-31 00:00:00,090 : INFO : Loss: 1.0\n", + "2019-01-31 00:00:05,340 : INFO : Loss: 1.0001264964909649\n", + "2019-01-31 00:00:10,660 : INFO : Loss: 1.0003099669567983\n", + "2019-01-31 00:00:15,846 : INFO : Loss: 0.999510447047944\n", + "2019-01-31 00:00:21,189 : INFO : Loss: 
0.9998373104438704\n", + "2019-01-31 00:00:26,610 : INFO : Loss: 0.9995054808665768\n", + "2019-01-31 00:00:31,824 : INFO : Loss: 1.0008622014983644\n", + "2019-01-31 00:00:37,155 : INFO : Loss: 0.9997513667540812\n", + "2019-01-31 00:00:42,391 : INFO : Loss: 1.000112602276772\n", + "2019-01-31 00:00:47,562 : INFO : Loss: 0.999614659204462\n", + "2019-01-31 00:00:52,875 : INFO : Loss: 0.9996428659515518\n", + "2019-01-31 00:00:58,145 : INFO : Loss: 0.9996863887344251\n", + "2019-01-31 00:01:03,445 : INFO : Loss: 0.9995239914092358\n", + "2019-01-31 00:01:08,885 : INFO : Loss: 0.9995073748133226\n", + "2019-01-31 00:01:14,242 : INFO : Loss: 1.0003544989505417\n", + "2019-01-31 00:01:19,604 : INFO : Loss: 1.0012755530698754\n", + "2019-01-31 00:01:24,644 : INFO : Loss: 1.0\n", + "2019-01-31 00:01:29,877 : INFO : Loss: 0.99966203211569\n", + "2019-01-31 00:01:35,039 : INFO : Loss: 0.9998002679855106\n", + "2019-01-31 00:01:40,211 : INFO : Loss: 0.9995272854993261\n", + "2019-01-31 00:01:45,627 : INFO : Loss: 0.9997888099016539\n", + "2019-01-31 00:01:50,963 : INFO : Loss: 0.9998562780997933\n", + "2019-01-31 00:01:56,264 : INFO : Loss: 0.9997473628030654\n", + "2019-01-31 00:02:01,555 : INFO : Loss: 1.0003431605249815\n", + "2019-01-31 00:02:06,729 : INFO : Loss: 1.0007903437271084\n", + "2019-01-31 00:02:11,928 : INFO : Loss: 0.9996308245384098\n", + "2019-01-31 00:02:17,125 : INFO : Loss: 0.999614879237478\n", + "2019-01-31 00:02:22,374 : INFO : Loss: 1.0005106541696671\n", + "2019-01-31 00:02:28,302 : INFO : Loss: 0.9997306365770836\n", + "2019-01-31 00:02:33,649 : INFO : Loss: 0.9998478611893203\n", + "2019-01-31 00:02:38,974 : INFO : Loss: 0.9994914532031707\n", + "2019-01-31 00:02:44,203 : INFO : Loss: 1.0\n", + "2019-01-31 00:02:49,225 : INFO : Loss: 1.0\n", + "2019-01-31 00:02:54,595 : INFO : Loss: 0.9998652359311595\n", + "2019-01-31 00:02:59,729 : INFO : Loss: 0.9996833407421091\n", + "2019-01-31 00:03:05,085 : INFO : Loss: 0.9996180471892749\n", + 
"2019-01-31 00:03:10,404 : INFO : Loss: 0.9996931412100092\n", + "2019-01-31 00:03:15,525 : INFO : Loss: 1.0008416184086477\n", + "2019-01-31 00:03:20,604 : INFO : Loss: 1.0\n", + "2019-01-31 00:03:26,557 : INFO : Loss: 0.9998130261219252\n", + "2019-01-31 00:03:31,849 : INFO : Loss: 0.9997170788505965\n", + "2019-01-31 00:03:37,042 : INFO : Loss: 0.9998773189717101\n", + "2019-01-31 00:03:42,323 : INFO : Loss: 0.999892658139298\n", + "2019-01-31 00:03:47,376 : INFO : Loss: 0.9997717371453464\n", + "2019-01-31 00:03:52,678 : INFO : Loss: 0.9998946683607691\n", + "2019-01-31 00:03:57,864 : INFO : Loss: 1.0002281674740388\n", + "2019-01-31 00:04:03,286 : INFO : Loss: 0.999715879131544\n", + "2019-01-31 00:04:08,944 : INFO : Loss: 1.0003323213881778\n", + "2019-01-31 00:04:14,185 : INFO : Loss: 0.999676269832639\n", + "2019-01-31 00:04:19,367 : INFO : Loss: 1.0\n", + "2019-01-31 00:04:24,588 : INFO : Loss: 0.9995829561522159\n", + "2019-01-31 00:04:29,857 : INFO : Loss: 0.9998033643456774\n", + "2019-01-31 00:04:35,007 : INFO : Loss: 0.9998542048725552\n", + "2019-01-31 00:04:40,302 : INFO : Loss: 1.0001348536908885\n", + "2019-01-31 00:04:45,362 : INFO : Loss: 0.9997062111511045\n", + "2019-01-31 00:04:50,531 : INFO : Loss: 0.9997433373378711\n", + "2019-01-31 00:04:55,782 : INFO : Loss: 0.9996415014654532\n", + "2019-01-31 00:05:00,922 : INFO : Loss: 0.9997769304322037\n", + "2019-01-31 00:05:05,857 : INFO : Loss: 0.9997176984039825\n", + "2019-01-31 00:05:11,163 : INFO : Loss: 0.9997360219022641\n", + "2019-01-31 00:05:16,195 : INFO : Loss: 0.9997746634954645\n", + "2019-01-31 00:05:21,071 : INFO : Loss: 1.0\n", + "2019-01-31 00:05:26,238 : INFO : Loss: 1.0\n", + "2019-01-31 00:05:31,524 : INFO : Loss: 0.9997525633663635\n", + "2019-01-31 00:05:36,869 : INFO : Loss: 1.0005806645002224\n", + "2019-01-31 00:05:42,163 : INFO : Loss: 1.0001624907418802\n" ] }, - { - "data": { - "text/plain": [ - "[(0,\n", - " '0.075*\"parti\" + 0.071*\"elect\" + 0.042*\"democrat\" + 
0.029*\"republican\" + 0.022*\"vote\" + 0.018*\"conserv\" + 0.017*\"liber\" + 0.014*\"candid\" + 0.013*\"seat\" + 0.013*\"labour\"'),\n", - " (1,\n", - " '0.039*\"book\" + 0.038*\"centuri\" + 0.032*\"histori\" + 0.032*\"languag\" + 0.032*\"publish\" + 0.024*\"english\" + 0.023*\"world\" + 0.022*\"law\" + 0.022*\"govern\" + 0.021*\"nation\"'),\n", - " (2,\n", - " '0.050*\"war\" + 0.036*\"forc\" + 0.026*\"armi\" + 0.023*\"battl\" + 0.021*\"attack\" + 0.019*\"militari\" + 0.018*\"german\" + 0.016*\"british\" + 0.015*\"command\" + 0.014*\"kill\"'),\n", - " (3,\n", - " '0.119*\"race\" + 0.106*\"car\" + 0.073*\"engin\" + 0.035*\"model\" + 0.030*\"driver\" + 0.029*\"vehicl\" + 0.029*\"ford\" + 0.028*\"lap\" + 0.023*\"electr\" + 0.020*\"power\"'),\n", - " (4,\n", - " '0.102*\"leagu\" + 0.092*\"club\" + 0.049*\"footbal\" + 0.047*\"cup\" + 0.029*\"plai\" + 0.028*\"season\" + 0.028*\"divis\" + 0.028*\"goal\" + 0.022*\"team\" + 0.021*\"unit\"'),\n", - " (5,\n", - " '0.055*\"award\" + 0.041*\"best\" + 0.008*\"nomin\" + 0.008*\"year\" + 0.006*\"actress\" + 0.006*\"actor\" + 0.005*\"perform\" + 0.005*\"artist\" + 0.005*\"won\" + 0.005*\"outstand\"'),\n", - " (6,\n", - " '0.115*\"citi\" + 0.014*\"airport\" + 0.013*\"area\" + 0.011*\"popul\" + 0.010*\"san\" + 0.009*\"region\" + 0.008*\"center\" + 0.007*\"municip\" + 0.007*\"intern\" + 0.007*\"ukrainian\"'),\n", - " (7,\n", - " '0.316*\"act\" + 0.046*\"amend\" + 0.020*\"order\" + 0.018*\"ireland\" + 0.016*\"law\" + 0.015*\"regul\" + 0.013*\"court\" + 0.011*\"scotland\" + 0.011*\"road\" + 0.009*\"public\"'),\n", - " (8,\n", - " '0.102*\"align\" + 0.084*\"left\" + 0.022*\"right\" + 0.012*\"text\" + 0.011*\"style\" + 0.007*\"center\" + 0.004*\"bar\" + 0.003*\"till\" + 0.003*\"bgcolor\" + 0.003*\"color\"'),\n", - " (9,\n", - " '0.092*\"team\" + 0.027*\"race\" + 0.025*\"ret\" + 0.014*\"championship\" + 0.007*\"nation\" + 0.006*\"time\" + 0.006*\"sport\" + 0.005*\"stage\" + 0.005*\"coach\" + 0.005*\"finish\"'),\n", - " (10,\n", - " 
'0.135*\"compani\" + 0.089*\"ship\" + 0.035*\"product\" + 0.028*\"oper\" + 0.024*\"navi\" + 0.022*\"corpor\" + 0.021*\"oil\" + 0.021*\"launch\" + 0.021*\"bank\" + 0.021*\"built\"'),\n", - " (11,\n", - " '0.053*\"new\" + 0.019*\"york\" + 0.004*\"zealand\" + 0.003*\"jersei\" + 0.003*\"american\" + 0.002*\"time\" + 0.002*\"australia\" + 0.002*\"radio\" + 0.002*\"press\" + 0.002*\"washington\"'),\n", - " (12,\n", - " '0.036*\"world\" + 0.034*\"championship\" + 0.032*\"final\" + 0.029*\"match\" + 0.026*\"win\" + 0.026*\"round\" + 0.019*\"open\" + 0.018*\"won\" + 0.015*\"defeat\" + 0.015*\"cup\"'),\n", - " (13,\n", - " '0.019*\"album\" + 0.017*\"record\" + 0.014*\"band\" + 0.008*\"releas\" + 0.005*\"tour\" + 0.005*\"guitar\" + 0.005*\"vocal\" + 0.004*\"rock\" + 0.004*\"track\" + 0.004*\"music\"'),\n", - " (14,\n", - " '0.100*\"church\" + 0.017*\"cathol\" + 0.014*\"christian\" + 0.012*\"centuri\" + 0.012*\"saint\" + 0.011*\"bishop\" + 0.011*\"built\" + 0.009*\"list\" + 0.009*\"build\" + 0.008*\"roman\"'),\n", - " (15,\n", - " '0.088*\"presid\" + 0.072*\"minist\" + 0.046*\"prime\" + 0.015*\"govern\" + 0.014*\"gener\" + 0.011*\"met\" + 0.011*\"governor\" + 0.010*\"foreign\" + 0.010*\"visit\" + 0.009*\"council\"'),\n", - " (16,\n", - " '0.182*\"speci\" + 0.112*\"famili\" + 0.101*\"nov\" + 0.092*\"valid\" + 0.066*\"genu\" + 0.045*\"format\" + 0.040*\"member\" + 0.037*\"gen\" + 0.036*\"bird\" + 0.034*\"type\"'),\n", - " (17,\n", - " '0.029*\"season\" + 0.013*\"yard\" + 0.013*\"game\" + 0.011*\"plai\" + 0.008*\"team\" + 0.007*\"score\" + 0.007*\"win\" + 0.007*\"record\" + 0.006*\"run\" + 0.006*\"coach\"'),\n", - " (18,\n", - " '0.214*\"counti\" + 0.064*\"township\" + 0.017*\"area\" + 0.016*\"statist\" + 0.007*\"ohio\" + 0.006*\"metropolitan\" + 0.006*\"combin\" + 0.005*\"pennsylvania\" + 0.005*\"texa\" + 0.005*\"washington\"'),\n", - " (19,\n", - " '0.017*\"area\" + 0.016*\"river\" + 0.015*\"water\" + 0.006*\"larg\" + 0.006*\"region\" + 0.006*\"lake\" + 0.006*\"power\" + 
0.006*\"high\" + 0.005*\"bar\" + 0.005*\"form\"'),\n", - " (20,\n", - " '0.031*\"us\" + 0.025*\"gener\" + 0.024*\"model\" + 0.022*\"data\" + 0.021*\"design\" + 0.020*\"time\" + 0.019*\"function\" + 0.019*\"number\" + 0.018*\"process\" + 0.017*\"exampl\"'),\n", - " (21,\n", - " '0.202*\"order\" + 0.098*\"group\" + 0.098*\"regul\" + 0.076*\"amend\" + 0.041*\"road\" + 0.034*\"traffic\" + 0.033*\"temporari\" + 0.032*\"prohibit\" + 0.027*\"trunk\" + 0.021*\"junction\"'),\n", - " (22,\n", - " '0.096*\"film\" + 0.010*\"product\" + 0.010*\"director\" + 0.010*\"festiv\" + 0.009*\"star\" + 0.009*\"produc\" + 0.009*\"movi\" + 0.008*\"direct\" + 0.007*\"releas\" + 0.007*\"actor\"'),\n", - " (23,\n", - " '0.163*\"music\" + 0.046*\"viola\" + 0.045*\"radio\" + 0.042*\"piano\" + 0.029*\"perform\" + 0.028*\"station\" + 0.027*\"orchestra\" + 0.026*\"compos\" + 0.025*\"song\" + 0.015*\"rock\"'),\n", - " (24,\n", - " '0.052*\"mount\" + 0.051*\"lemmon\" + 0.051*\"peak\" + 0.051*\"kitt\" + 0.051*\"spacewatch\" + 0.026*\"survei\" + 0.015*\"octob\" + 0.012*\"septemb\" + 0.009*\"css\" + 0.009*\"catalina\"'),\n", - " (25,\n", - " '0.075*\"air\" + 0.035*\"forc\" + 0.030*\"squadron\" + 0.029*\"aircraft\" + 0.028*\"oper\" + 0.023*\"unit\" + 0.018*\"flight\" + 0.017*\"airport\" + 0.017*\"wing\" + 0.017*\"base\"'),\n", - " (26,\n", - " '0.105*\"hous\" + 0.038*\"term\" + 0.020*\"march\" + 0.019*\"build\" + 0.019*\"member\" + 0.017*\"serv\" + 0.014*\"congress\" + 0.014*\"hall\" + 0.012*\"januari\" + 0.010*\"window\"'),\n", - " (27,\n", - " '0.129*\"district\" + 0.019*\"pennsylvania\" + 0.016*\"grade\" + 0.012*\"fund\" + 0.012*\"educ\" + 0.012*\"basic\" + 0.011*\"level\" + 0.010*\"oblast\" + 0.010*\"rural\" + 0.009*\"tax\"'),\n", - " (28,\n", - " '0.042*\"year\" + 0.012*\"dai\" + 0.007*\"time\" + 0.005*\"ag\" + 0.004*\"month\" + 0.003*\"includ\" + 0.003*\"follow\" + 0.003*\"later\" + 0.003*\"old\" + 0.003*\"student\"'),\n", - " (29,\n", - " '0.113*\"station\" + 0.109*\"line\" + 0.076*\"road\" + 
0.072*\"railwai\" + 0.048*\"rout\" + 0.035*\"oper\" + 0.034*\"train\" + 0.023*\"street\" + 0.020*\"cross\" + 0.020*\"railroad\"'),\n", - " (30,\n", - " '0.036*\"park\" + 0.029*\"town\" + 0.025*\"north\" + 0.020*\"south\" + 0.018*\"west\" + 0.017*\"east\" + 0.017*\"street\" + 0.015*\"nation\" + 0.014*\"build\" + 0.013*\"river\"'),\n", - " (31,\n", - " '0.066*\"women\" + 0.044*\"men\" + 0.030*\"nation\" + 0.024*\"right\" + 0.014*\"athlet\" + 0.013*\"intern\" + 0.013*\"rank\" + 0.013*\"countri\" + 0.012*\"advanc\" + 0.011*\"event\"'),\n", - " (32,\n", - " '0.127*\"linear\" + 0.126*\"socorro\" + 0.029*\"septemb\" + 0.026*\"neat\" + 0.023*\"palomar\" + 0.021*\"octob\" + 0.016*\"kitt\" + 0.016*\"peak\" + 0.015*\"spacewatch\" + 0.015*\"anderson\"'),\n", - " (33,\n", - " '0.152*\"univers\" + 0.055*\"colleg\" + 0.019*\"institut\" + 0.018*\"student\" + 0.018*\"scienc\" + 0.015*\"professor\" + 0.012*\"research\" + 0.011*\"campu\" + 0.011*\"educ\" + 0.011*\"technolog\"'),\n", - " (34,\n", - " '0.072*\"state\" + 0.032*\"unit\" + 0.005*\"court\" + 0.005*\"law\" + 0.004*\"feder\" + 0.004*\"american\" + 0.003*\"nation\" + 0.003*\"govern\" + 0.003*\"kingdom\" + 0.003*\"senat\"'),\n", - " (35,\n", - " '0.074*\"game\" + 0.017*\"player\" + 0.007*\"plai\" + 0.006*\"releas\" + 0.005*\"develop\" + 0.005*\"video\" + 0.005*\"charact\" + 0.004*\"playstat\" + 0.004*\"version\" + 0.004*\"world\"'),\n", - " (36,\n", - " '0.141*\"south\" + 0.098*\"american\" + 0.081*\"india\" + 0.059*\"commun\" + 0.053*\"west\" + 0.053*\"director\" + 0.053*\"africa\" + 0.049*\"usa\" + 0.049*\"indian\" + 0.041*\"servic\"'),\n", - " (37,\n", - " '0.111*\"servic\" + 0.025*\"commun\" + 0.021*\"offic\" + 0.012*\"polic\" + 0.011*\"educ\" + 0.011*\"public\" + 0.010*\"chief\" + 0.009*\"late\" + 0.009*\"manag\" + 0.008*\"mr\"'),\n", - " (38,\n", - " '0.112*\"royal\" + 0.085*\"john\" + 0.083*\"william\" + 0.054*\"lieuten\" + 0.044*\"georg\" + 0.041*\"offic\" + 0.041*\"jame\" + 0.038*\"sergeant\" + 0.037*\"major\" + 
0.035*\"charl\"'),\n", - " (39,\n", - " '0.051*\"song\" + 0.043*\"releas\" + 0.042*\"singl\" + 0.027*\"chart\" + 0.025*\"album\" + 0.017*\"number\" + 0.014*\"video\" + 0.013*\"version\" + 0.012*\"love\" + 0.011*\"featur\"'),\n", - " (40,\n", - " '0.031*\"time\" + 0.028*\"later\" + 0.026*\"appear\" + 0.025*\"man\" + 0.024*\"kill\" + 0.020*\"charact\" + 0.019*\"work\" + 0.018*\"father\" + 0.018*\"death\" + 0.018*\"famili\"'),\n", - " (41,\n", - " '0.126*\"seri\" + 0.064*\"episod\" + 0.026*\"season\" + 0.021*\"televis\" + 0.015*\"comic\" + 0.013*\"charact\" + 0.012*\"dvd\" + 0.012*\"anim\" + 0.012*\"star\" + 0.011*\"appear\"'),\n", - " (42,\n", - " '0.143*\"born\" + 0.073*\"american\" + 0.027*\"footbal\" + 0.024*\"player\" + 0.024*\"william\" + 0.023*\"singer\" + 0.019*\"actor\" + 0.017*\"politician\" + 0.015*\"actress\" + 0.013*\"english\"'),\n", - " (43,\n", - " '0.044*\"march\" + 0.042*\"septemb\" + 0.036*\"octob\" + 0.033*\"januari\" + 0.032*\"april\" + 0.031*\"august\" + 0.031*\"juli\" + 0.029*\"novemb\" + 0.029*\"june\" + 0.028*\"decemb\"'),\n", - " (44,\n", - " '0.149*\"island\" + 0.013*\"south\" + 0.013*\"australia\" + 0.009*\"sea\" + 0.008*\"north\" + 0.008*\"bai\" + 0.008*\"western\" + 0.008*\"airport\" + 0.007*\"coast\" + 0.006*\"pacif\"'),\n", - " (45,\n", - " '0.028*\"studi\" + 0.026*\"research\" + 0.023*\"health\" + 0.019*\"human\" + 0.019*\"term\" + 0.019*\"develop\" + 0.018*\"includ\" + 0.018*\"peopl\" + 0.017*\"report\" + 0.017*\"cell\"'),\n", - " (46,\n", - " '0.112*\"school\" + 0.028*\"high\" + 0.016*\"student\" + 0.012*\"educ\" + 0.009*\"grade\" + 0.008*\"primari\" + 0.007*\"public\" + 0.006*\"colleg\" + 0.006*\"elementari\" + 0.006*\"pennsylvania\"'),\n", - " (47,\n", - " '0.137*\"royal\" + 0.121*\"capt\" + 0.103*\"armi\" + 0.090*\"maj\" + 0.089*\"corp\" + 0.075*\"col\" + 0.074*\"temp\" + 0.048*\"servic\" + 0.040*\"engin\" + 0.033*\"reg\"'),\n", - " (48,\n", - " '0.183*\"art\" + 0.117*\"museum\" + 0.071*\"paint\" + 0.062*\"work\" + 
0.046*\"artist\" + 0.043*\"galleri\" + 0.040*\"exhibit\" + 0.034*\"collect\" + 0.027*\"histori\" + 0.022*\"jpg\"'),\n", - " (49,\n", - " '0.068*\"regiment\" + 0.062*\"divis\" + 0.049*\"battalion\" + 0.045*\"infantri\" + 0.036*\"brigad\" + 0.024*\"armi\" + 0.023*\"artilleri\" + 0.019*\"compani\" + 0.018*\"gener\" + 0.018*\"colonel\"')]" - ] - }, - "execution_count": 14, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "nmf = Nmf.load('nmf.model')\n", - "row.update(get_tm_metrics(nmf, test_corpus))\n", - "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)\n", - "\n", - "nmf.show_topics(50)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Train NMF with residuals and save it\n", - "Residuals add regularization to the model thus increasing quality, but slows down training" - ] - }, - { - "cell_type": "code", - "execution_count": 15, - "metadata": { - "scrolled": false - }, - "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "2019-01-15 20:54:05,363 : INFO : Loss (no outliers): 2179.9524465227146\tLoss (with outliers): 2102.354108449905\n", - "2019-01-15 20:57:12,821 : INFO : Loss (no outliers): 2268.3200929871823\tLoss (with outliers): 2110.928651253909\n", - "==Truncated==\n", - "2019-01-16 04:05:46,589 : INFO : Loss (no outliers): 1321.521323758918\tLoss (with outliers): 1282.9364495345592\n", - "2019-01-16 04:05:46,599 : INFO : saving Nmf object under nmf_with_r.model, separately None\n", - "2019-01-16 04:05:46,601 : INFO : storing scipy.sparse array '_r' under nmf_with_r.model._r.npy\n", - "2019-01-16 04:05:47,781 : INFO : saved nmf_with_r.model\n" + "2019-01-31 00:05:47,007 : INFO : Loss: 0.9996352155288082\n", + "2019-01-31 00:05:52,261 : INFO : Loss: 1.0004395613185166\n", + "2019-01-31 00:05:57,342 : INFO : Loss: 1.0\n", + "2019-01-31 00:06:02,548 : INFO : Loss: 0.9998527076273703\n", + "2019-01-31 00:06:07,609 : INFO : Loss: 0.9996924850765493\n", + "2019-01-31 
00:06:12,841 : INFO : Loss: 0.9998465986185003\n", + "2019-01-31 00:06:18,157 : INFO : Loss: 0.9997732510121399\n", + "2019-01-31 00:06:23,211 : INFO : Loss: 0.9997941508395527\n", + "2019-01-31 00:06:28,233 : INFO : Loss: 0.9995770839553472\n", + "2019-01-31 00:06:33,449 : INFO : Loss: 0.9997390770111323\n", + "2019-01-31 00:06:38,821 : INFO : Loss: 0.9997499890547042\n", + "2019-01-31 00:06:43,967 : INFO : Loss: 1.0002122989122686\n", + "2019-01-31 00:06:48,974 : INFO : Loss: 1.0\n", + "2019-01-31 00:06:54,205 : INFO : Loss: 0.9996768801524232\n", + "2019-01-31 00:06:59,422 : INFO : Loss: 0.9998134505747993\n", + "2019-01-31 00:07:04,626 : INFO : Loss: 1.0001153274263432\n", + "2019-01-31 00:07:09,638 : INFO : Loss: 0.9997996517667606\n", + "2019-01-31 00:07:14,849 : INFO : Loss: 0.9998403875727927\n", + "2019-01-31 00:07:20,090 : INFO : Loss: 0.9996267017145936\n", + "2019-01-31 00:07:25,508 : INFO : Loss: 0.9997907577614406\n", + "2019-01-31 00:07:30,734 : INFO : Loss: 0.9997841500239624\n", + "2019-01-31 00:07:36,017 : INFO : Loss: 1.0\n", + "2019-01-31 00:07:41,135 : INFO : Loss: 0.9997873958125003\n", + "2019-01-31 00:07:46,540 : INFO : Loss: 0.9997595467577249\n", + "2019-01-31 00:07:51,748 : INFO : Loss: 0.999873831646166\n", + "2019-01-31 00:07:57,127 : INFO : Loss: 0.9998347951106515\n", + "2019-01-31 00:08:02,303 : INFO : Loss: 0.9998140553862679\n", + "2019-01-31 00:08:07,383 : INFO : Loss: 1.0\n", + "2019-01-31 00:08:12,659 : INFO : Loss: 0.9998790606131965\n", + "2019-01-31 00:08:17,961 : INFO : Loss: 1.0012735986432386\n", + "2019-01-31 00:08:23,045 : INFO : Loss: 0.999858411002553\n", + "2019-01-31 00:08:28,185 : INFO : Loss: 1.0\n", + "2019-01-31 00:08:33,478 : INFO : Loss: 0.9998548688610734\n", + "2019-01-31 00:08:38,574 : INFO : Loss: 0.9998995265289764\n", + "2019-01-31 00:08:43,852 : INFO : Loss: 0.9996783400306337\n", + "2019-01-31 00:08:48,908 : INFO : Loss: 0.999809554970957\n", + "2019-01-31 00:08:54,134 : INFO : Loss: 
0.9998686530125888\n", + "2019-01-31 00:08:59,089 : INFO : Loss: 1.0\n", + "2019-01-31 00:09:04,296 : INFO : Loss: 0.9998445345959373\n", + "2019-01-31 00:09:09,296 : INFO : Loss: 1.0\n", + "2019-01-31 00:09:14,588 : INFO : Loss: 0.9998738577942256\n", + "2019-01-31 00:09:19,823 : INFO : Loss: 0.9998218345196497\n", + "2019-01-31 00:09:25,763 : INFO : Loss: 0.9997310226556387\n", + "2019-01-31 00:09:30,687 : INFO : Loss: 0.9998278855547782\n", + "2019-01-31 00:09:35,864 : INFO : Loss: 0.9998134496128264\n", + "2019-01-31 00:09:40,772 : INFO : Loss: 1.0\n", + "2019-01-31 00:09:45,996 : INFO : Loss: 1.0001263005843612\n", + "2019-01-31 00:09:50,992 : INFO : Loss: 1.000122255529092\n", + "2019-01-31 00:09:55,857 : INFO : Loss: 1.0\n", + "2019-01-31 00:10:00,948 : INFO : Loss: 1.0\n", + "2019-01-31 00:10:06,167 : INFO : Loss: 0.9998815976117489\n", + "2019-01-31 00:10:11,262 : INFO : Loss: 0.999890247300433\n", + "2019-01-31 00:10:16,500 : INFO : Loss: 0.9998806365118564\n", + "2019-01-31 00:10:21,694 : INFO : Loss: 1.0001709576054592\n", + "2019-01-31 00:10:26,958 : INFO : Loss: 1.0\n", + "2019-01-31 00:10:32,250 : INFO : Loss: 0.9998330489296149\n", + "2019-01-31 00:10:37,228 : INFO : Loss: 1.0\n", + "2019-01-31 00:10:42,163 : INFO : Loss: 1.0\n", + "2019-01-31 00:10:47,334 : INFO : Loss: 0.9998966449924491\n", + "2019-01-31 00:10:52,615 : INFO : Loss: 1.0003706657662512\n", + "2019-01-31 00:10:57,904 : INFO : Loss: 0.9997845906095503\n", + "2019-01-31 00:11:02,918 : INFO : Loss: 1.0\n", + "2019-01-31 00:11:07,999 : INFO : Loss: 0.9998334349495988\n", + "2019-01-31 00:11:13,335 : INFO : Loss: 0.9998445825797048\n", + "2019-01-31 00:11:18,437 : INFO : Loss: 1.0\n", + "2019-01-31 00:11:23,781 : INFO : Loss: 0.9998438578968686\n", + "2019-01-31 00:11:28,865 : INFO : Loss: 0.9998068614306783\n", + "2019-01-31 00:11:34,139 : INFO : Loss: 1.0004395455200112\n", + "2019-01-31 00:11:39,209 : INFO : Loss: 0.9998766923098149\n", + "2019-01-31 00:11:44,425 : INFO : Loss: 
0.9997906796629782\n", + "2019-01-31 00:11:49,535 : INFO : Loss: 1.0001801536949044\n", + "2019-01-31 00:11:54,579 : INFO : Loss: 1.0001437620714628\n", + "2019-01-31 00:11:59,748 : INFO : Loss: 1.0\n", + "2019-01-31 00:12:04,987 : INFO : Loss: 0.999884636287942\n", + "2019-01-31 00:12:10,210 : INFO : Loss: 0.9998901577816464\n", + "2019-01-31 00:12:15,452 : INFO : Loss: 0.9998956750880632\n", + "2019-01-31 00:12:20,596 : INFO : Loss: 1.000601359253442\n", + "2019-01-31 00:12:25,881 : INFO : Loss: 0.9998337004095269\n", + "2019-01-31 00:12:31,113 : INFO : Loss: 0.9997855646540594\n", + "2019-01-31 00:12:36,300 : INFO : Loss: 0.9998248266745982\n", + "2019-01-31 00:12:41,551 : INFO : Loss: 0.999853040713727\n", + "2019-01-31 00:12:46,496 : INFO : Loss: 1.0\n", + "2019-01-31 00:12:51,501 : INFO : Loss: 1.0\n", + "2019-01-31 00:12:56,720 : INFO : Loss: 0.9998980680510154\n", + "2019-01-31 00:13:01,810 : INFO : Loss: 0.9997133093239652\n", + "2019-01-31 00:13:06,749 : INFO : Loss: 1.0001004306361925\n", + "2019-01-31 00:13:12,510 : INFO : Loss: 0.9998121380431872\n", + "2019-01-31 00:13:17,541 : INFO : Loss: 1.000437901798028\n", + "2019-01-31 00:13:22,733 : INFO : Loss: 0.9998402614113828\n", + "2019-01-31 00:13:27,866 : INFO : Loss: 0.9998710291755407\n", + "2019-01-31 00:13:32,989 : INFO : Loss: 1.000374596112327\n", + "2019-01-31 00:13:38,039 : INFO : Loss: 0.9998417020643313\n", + "2019-01-31 00:13:43,181 : INFO : Loss: 0.9998518749352925\n", + "2019-01-31 00:13:48,367 : INFO : Loss: 1.0\n", + "2019-01-31 00:13:53,164 : INFO : Loss: 1.0001097961478265\n", + "2019-01-31 00:13:58,309 : INFO : Loss: 1.000755562323596\n", + "2019-01-31 00:14:03,222 : INFO : Loss: 1.0001917822169584\n", + "2019-01-31 00:14:08,151 : INFO : Loss: 1.0\n", + "2019-01-31 00:14:13,369 : INFO : Loss: 1.0001054497548354\n", + "2019-01-31 00:14:18,332 : INFO : Loss: 1.0\n", + "2019-01-31 00:14:19,114 : INFO : Loss: 0.9997699788421133\n", + "2019-01-31 00:14:19,127 : INFO : saving Nmf object 
under gensim_nmf.model, separately None\n", + "2019-01-31 00:14:19,520 : INFO : saved gensim_nmf.model\n" ] } ], "source": [ "row = dict()\n", - "row['model'] = 'nmf_with_r'\n", - "row['train_time'], nmf_with_r = get_execution_time(\n", - " lambda: Nmf(\n", - " use_r=True,\n", - " lambda_=200,\n", + "row['model'] = 'gensim_nmf'\n", + "row['train_time'], row['mean_ram'], row['max_ram'], nmf = get_train_time_and_ram(\n", + " lambda: GensimNmf(\n", " normalize=False,\n", " **params\n", - " )\n", + " ),\n", + " 'gensim_nmf',\n", ")\n", - "nmf_with_r.save('nmf_with_r.model')" + "\n", + "nmf.save('gensim_nmf.model')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "### Load NMF with residuals and store metrics" + "### Load Gensim NMF and store metrics" ] }, { @@ -713,130 +875,20 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-16 04:05:48,017 : INFO : loading Nmf object from nmf_with_r.model\n", - "2019-01-16 04:05:48,272 : INFO : loading id2word recursively from nmf_with_r.model.id2word.* with mmap=None\n", - "2019-01-16 04:05:48,273 : INFO : loading _r from nmf_with_r.model._r.npy with mmap=None\n", - "2019-01-16 04:05:48,304 : INFO : loaded nmf_with_r.model\n", - "2019-01-16 04:06:27,119 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-16 04:06:27,253 : INFO : CorpusAccumulator accumulated stats from 2000 documents\n" + "2019-01-31 00:14:19,539 : INFO : loading Nmf object from gensim_nmf.model\n", + "2019-01-31 00:14:19,856 : INFO : loading id2word recursively from gensim_nmf.model.id2word.* with mmap=None\n", + "2019-01-31 00:14:19,856 : INFO : loaded gensim_nmf.model\n", + "/home/anotherbugmaster/gensim/gensim/matutils.py:503: FutureWarning: arrays to stack must be passed as a \"sequence\" type such as list or tuple. 
Support for non-sequence iterables such as generators is deprecated as of NumPy 1.16 and will raise an error in the future.\n", + " result = np.column_stack(sparse2full(doc, num_terms) for doc in corpus)\n", + "2019-01-31 00:14:59,973 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", + "2019-01-31 00:15:00,082 : INFO : CorpusAccumulator accumulated stats from 2000 documents\n" ] - }, - { - "data": { - "text/plain": [ - "[(0,\n", - " '0.062*\"parti\" + 0.061*\"elect\" + 0.031*\"democrat\" + 0.020*\"republican\" + 0.020*\"vote\" + 0.013*\"liber\" + 0.012*\"candid\" + 0.012*\"conserv\" + 0.011*\"seat\" + 0.010*\"member\"'),\n", - " (1,\n", - " '0.052*\"book\" + 0.040*\"centuri\" + 0.039*\"publish\" + 0.031*\"languag\" + 0.027*\"histori\" + 0.025*\"work\" + 0.023*\"english\" + 0.022*\"king\" + 0.019*\"polit\" + 0.019*\"author\"'),\n", - " (2,\n", - " '0.031*\"armi\" + 0.028*\"divis\" + 0.025*\"regiment\" + 0.022*\"forc\" + 0.020*\"battalion\" + 0.019*\"infantri\" + 0.019*\"command\" + 0.017*\"brigad\" + 0.016*\"gener\" + 0.012*\"corp\"'),\n", - " (3,\n", - " '0.110*\"race\" + 0.059*\"car\" + 0.033*\"engin\" + 0.025*\"lap\" + 0.023*\"driver\" + 0.021*\"ret\" + 0.020*\"ford\" + 0.015*\"finish\" + 0.015*\"motorsport\" + 0.015*\"chevrolet\"'),\n", - " (4,\n", - " '0.130*\"club\" + 0.068*\"cup\" + 0.046*\"footbal\" + 0.044*\"goal\" + 0.032*\"leagu\" + 0.031*\"unit\" + 0.031*\"plai\" + 0.030*\"match\" + 0.026*\"score\" + 0.021*\"player\"'),\n", - " (5,\n", - " '0.041*\"award\" + 0.030*\"best\" + 0.006*\"nomin\" + 0.005*\"actress\" + 0.005*\"year\" + 0.004*\"actor\" + 0.004*\"won\" + 0.004*\"perform\" + 0.003*\"outstand\" + 0.003*\"artist\"'),\n", - " (6,\n", - " '0.087*\"citi\" + 0.013*\"town\" + 0.009*\"popul\" + 0.008*\"area\" + 0.007*\"san\" + 0.006*\"center\" + 0.006*\"airport\" + 0.006*\"unit\" + 0.006*\"locat\" + 0.005*\"municip\"'),\n", - " (7,\n", - " '0.171*\"act\" + 0.021*\"amend\" + 0.018*\"order\" + 0.010*\"ireland\" + 0.009*\"law\" + 
0.007*\"court\" + 0.007*\"regul\" + 0.006*\"road\" + 0.006*\"scotland\" + 0.006*\"nation\"'),\n", - " (8,\n", - " '0.064*\"leagu\" + 0.014*\"divis\" + 0.012*\"left\" + 0.011*\"align\" + 0.009*\"basebal\" + 0.008*\"footbal\" + 0.007*\"run\" + 0.007*\"major\" + 0.005*\"home\" + 0.005*\"hit\"'),\n", - " (9,\n", - " '0.086*\"team\" + 0.013*\"championship\" + 0.007*\"nation\" + 0.007*\"race\" + 0.007*\"coach\" + 0.005*\"time\" + 0.004*\"sport\" + 0.004*\"ret\" + 0.004*\"player\" + 0.004*\"match\"'),\n", - " (10,\n", - " '0.100*\"episod\" + 0.055*\"compani\" + 0.021*\"product\" + 0.011*\"produc\" + 0.011*\"televis\" + 0.009*\"role\" + 0.009*\"busi\" + 0.008*\"market\" + 0.008*\"corpor\" + 0.007*\"bank\"'),\n", - " (11,\n", - " '0.050*\"new\" + 0.017*\"york\" + 0.003*\"zealand\" + 0.003*\"jersei\" + 0.002*\"time\" + 0.002*\"radio\" + 0.002*\"broadcast\" + 0.002*\"station\" + 0.002*\"washington\" + 0.002*\"australia\"'),\n", - " (12,\n", - " '0.035*\"final\" + 0.033*\"world\" + 0.030*\"round\" + 0.030*\"championship\" + 0.025*\"win\" + 0.025*\"match\" + 0.021*\"open\" + 0.017*\"won\" + 0.016*\"tournament\" + 0.015*\"event\"'),\n", - " (13,\n", - " '0.020*\"record\" + 0.019*\"band\" + 0.015*\"album\" + 0.007*\"releas\" + 0.007*\"guitar\" + 0.006*\"tour\" + 0.005*\"rock\" + 0.005*\"vocal\" + 0.004*\"plai\" + 0.004*\"live\"'),\n", - " (14,\n", - " '0.096*\"church\" + 0.015*\"cathol\" + 0.012*\"christian\" + 0.010*\"saint\" + 0.010*\"bishop\" + 0.009*\"centuri\" + 0.008*\"build\" + 0.007*\"parish\" + 0.007*\"built\" + 0.007*\"roman\"'),\n", - " (15,\n", - " '0.084*\"presid\" + 0.055*\"minist\" + 0.037*\"prime\" + 0.014*\"govern\" + 0.012*\"gener\" + 0.010*\"governor\" + 0.010*\"nation\" + 0.008*\"council\" + 0.008*\"secretari\" + 0.008*\"visit\"'),\n", - " (16,\n", - " '0.089*\"yard\" + 0.035*\"pass\" + 0.035*\"touchdown\" + 0.028*\"field\" + 0.025*\"run\" + 0.023*\"win\" + 0.022*\"score\" + 0.021*\"quarter\" + 0.017*\"record\" + 0.016*\"second\"'),\n", - " (17,\n", - " 
'0.042*\"season\" + 0.006*\"plai\" + 0.004*\"coach\" + 0.004*\"final\" + 0.004*\"second\" + 0.004*\"win\" + 0.004*\"record\" + 0.003*\"career\" + 0.003*\"finish\" + 0.003*\"point\"'),\n", - " (18,\n", - " '0.174*\"counti\" + 0.034*\"township\" + 0.014*\"area\" + 0.013*\"statist\" + 0.004*\"texa\" + 0.004*\"ohio\" + 0.004*\"virginia\" + 0.004*\"washington\" + 0.003*\"metropolitan\" + 0.003*\"pennsylvania\"'),\n", - " (19,\n", - " '0.012*\"water\" + 0.010*\"area\" + 0.010*\"speci\" + 0.007*\"larg\" + 0.006*\"order\" + 0.006*\"region\" + 0.006*\"includ\" + 0.005*\"black\" + 0.005*\"famili\" + 0.005*\"popul\"'),\n", - " (20,\n", - " '0.020*\"us\" + 0.015*\"gener\" + 0.014*\"design\" + 0.014*\"model\" + 0.012*\"develop\" + 0.012*\"time\" + 0.012*\"data\" + 0.011*\"number\" + 0.011*\"function\" + 0.011*\"process\"'),\n", - " (21,\n", - " '0.165*\"group\" + 0.023*\"left\" + 0.022*\"align\" + 0.021*\"member\" + 0.017*\"text\" + 0.015*\"bar\" + 0.011*\"order\" + 0.011*\"point\" + 0.010*\"till\" + 0.009*\"stage\"'),\n", - " (22,\n", - " '0.095*\"film\" + 0.009*\"director\" + 0.008*\"star\" + 0.008*\"movi\" + 0.008*\"product\" + 0.008*\"festiv\" + 0.008*\"releas\" + 0.008*\"produc\" + 0.007*\"direct\" + 0.006*\"featur\"'),\n", - " (23,\n", - " '0.107*\"music\" + 0.024*\"perform\" + 0.019*\"piano\" + 0.018*\"song\" + 0.017*\"compos\" + 0.017*\"orchestra\" + 0.017*\"viola\" + 0.012*\"plai\" + 0.011*\"radio\" + 0.011*\"danc\"'),\n", - " (24,\n", - " '0.023*\"septemb\" + 0.023*\"march\" + 0.020*\"octob\" + 0.020*\"juli\" + 0.019*\"june\" + 0.019*\"april\" + 0.019*\"august\" + 0.018*\"januari\" + 0.018*\"novemb\" + 0.017*\"decemb\"'),\n", - " (25,\n", - " '0.078*\"air\" + 0.041*\"forc\" + 0.031*\"aircraft\" + 0.027*\"squadron\" + 0.026*\"oper\" + 0.021*\"unit\" + 0.016*\"base\" + 0.016*\"wing\" + 0.016*\"flight\" + 0.015*\"fighter\"'),\n", - " (26,\n", - " '0.101*\"hous\" + 0.023*\"build\" + 0.021*\"term\" + 0.015*\"member\" + 0.014*\"serv\" + 0.014*\"march\" + 0.014*\"left\" + 
0.012*\"congress\" + 0.011*\"hall\" + 0.010*\"street\"'),\n", - " (27,\n", - " '0.123*\"district\" + 0.024*\"pennsylvania\" + 0.019*\"grade\" + 0.016*\"educ\" + 0.015*\"fund\" + 0.014*\"basic\" + 0.013*\"level\" + 0.011*\"student\" + 0.011*\"receiv\" + 0.010*\"tax\"'),\n", - " (28,\n", - " '0.048*\"year\" + 0.007*\"dai\" + 0.005*\"time\" + 0.005*\"ag\" + 0.003*\"month\" + 0.003*\"old\" + 0.003*\"student\" + 0.003*\"includ\" + 0.003*\"later\" + 0.002*\"million\"'),\n", - " (29,\n", - " '0.090*\"line\" + 0.083*\"station\" + 0.054*\"road\" + 0.053*\"railwai\" + 0.036*\"rout\" + 0.030*\"train\" + 0.027*\"oper\" + 0.020*\"street\" + 0.016*\"servic\" + 0.016*\"open\"'),\n", - " (30,\n", - " '0.031*\"park\" + 0.030*\"south\" + 0.030*\"north\" + 0.023*\"west\" + 0.020*\"river\" + 0.020*\"east\" + 0.015*\"area\" + 0.014*\"town\" + 0.013*\"lake\" + 0.013*\"nation\"'),\n", - " (31,\n", - " '0.071*\"women\" + 0.041*\"men\" + 0.027*\"nation\" + 0.023*\"right\" + 0.012*\"countri\" + 0.012*\"intern\" + 0.012*\"athlet\" + 0.011*\"advanc\" + 0.011*\"rank\" + 0.010*\"law\"'),\n", - " (32,\n", - " '0.104*\"linear\" + 0.104*\"socorro\" + 0.025*\"septemb\" + 0.020*\"neat\" + 0.018*\"palomar\" + 0.018*\"octob\" + 0.013*\"decemb\" + 0.013*\"august\" + 0.012*\"anderson\" + 0.012*\"mesa\"'),\n", - " (33,\n", - " '0.089*\"univers\" + 0.011*\"scienc\" + 0.009*\"institut\" + 0.008*\"research\" + 0.008*\"professor\" + 0.006*\"student\" + 0.005*\"technolog\" + 0.005*\"faculti\" + 0.005*\"studi\" + 0.005*\"engin\"'),\n", - " (34,\n", - " '0.064*\"state\" + 0.024*\"unit\" + 0.005*\"court\" + 0.005*\"law\" + 0.004*\"feder\" + 0.003*\"nation\" + 0.003*\"govern\" + 0.002*\"senat\" + 0.002*\"california\" + 0.002*\"constitut\"'),\n", - " (35,\n", - " '0.085*\"colleg\" + 0.019*\"univers\" + 0.014*\"student\" + 0.008*\"campu\" + 0.007*\"institut\" + 0.006*\"educ\" + 0.005*\"hall\" + 0.005*\"program\" + 0.005*\"commun\" + 0.005*\"state\"'),\n", - " (36,\n", - " '0.118*\"class\" + 0.079*\"director\" + 
0.053*\"rifl\" + 0.050*\"south\" + 0.048*\"×mm\" + 0.046*\"action\" + 0.045*\"san\" + 0.044*\"actor\" + 0.041*\"angel\" + 0.037*\"lo\"'),\n", - " (37,\n", - " '0.092*\"servic\" + 0.025*\"offic\" + 0.023*\"commun\" + 0.013*\"john\" + 0.012*\"chief\" + 0.011*\"polic\" + 0.011*\"public\" + 0.011*\"british\" + 0.010*\"late\" + 0.010*\"director\"'),\n", - " (38,\n", - " '0.156*\"royal\" + 0.072*\"william\" + 0.068*\"john\" + 0.058*\"corp\" + 0.051*\"lieuten\" + 0.046*\"capt\" + 0.041*\"engin\" + 0.041*\"armi\" + 0.039*\"georg\" + 0.039*\"temp\"'),\n", - " (39,\n", - " '0.042*\"song\" + 0.039*\"album\" + 0.034*\"releas\" + 0.029*\"singl\" + 0.024*\"chart\" + 0.013*\"number\" + 0.011*\"video\" + 0.010*\"love\" + 0.010*\"featur\" + 0.010*\"track\"'),\n", - " (40,\n", - " '0.028*\"time\" + 0.025*\"later\" + 0.023*\"kill\" + 0.019*\"appear\" + 0.018*\"man\" + 0.016*\"death\" + 0.016*\"father\" + 0.015*\"return\" + 0.015*\"son\" + 0.014*\"charact\"'),\n", - " (41,\n", - " '0.110*\"seri\" + 0.016*\"charact\" + 0.016*\"episod\" + 0.015*\"comic\" + 0.013*\"televis\" + 0.012*\"anim\" + 0.011*\"appear\" + 0.009*\"stori\" + 0.009*\"origin\" + 0.009*\"featur\"'),\n", - " (42,\n", - " '0.091*\"born\" + 0.070*\"american\" + 0.022*\"player\" + 0.021*\"footbal\" + 0.020*\"william\" + 0.016*\"actor\" + 0.014*\"politician\" + 0.014*\"singer\" + 0.013*\"john\" + 0.012*\"actress\"'),\n", - " (43,\n", - " '0.072*\"game\" + 0.017*\"player\" + 0.011*\"plai\" + 0.004*\"releas\" + 0.004*\"point\" + 0.004*\"develop\" + 0.004*\"score\" + 0.003*\"video\" + 0.003*\"time\" + 0.003*\"card\"'),\n", - " (44,\n", - " '0.110*\"island\" + 0.007*\"australia\" + 0.007*\"ship\" + 0.007*\"south\" + 0.007*\"sea\" + 0.006*\"bai\" + 0.005*\"coast\" + 0.004*\"pacif\" + 0.004*\"western\" + 0.004*\"british\"'),\n", - " (45,\n", - " '0.029*\"health\" + 0.028*\"studi\" + 0.027*\"research\" + 0.022*\"peopl\" + 0.020*\"human\" + 0.019*\"medic\" + 0.019*\"cell\" + 0.018*\"report\" + 0.018*\"ag\" + 0.017*\"includ\"'),\n", 
- " (46,\n", - " '0.113*\"school\" + 0.025*\"high\" + 0.014*\"student\" + 0.011*\"educ\" + 0.007*\"grade\" + 0.006*\"public\" + 0.005*\"elementari\" + 0.005*\"primari\" + 0.004*\"pennsylvania\" + 0.004*\"teacher\"'),\n", - " (47,\n", - " '0.050*\"war\" + 0.021*\"german\" + 0.017*\"american\" + 0.016*\"british\" + 0.016*\"world\" + 0.012*\"french\" + 0.010*\"battl\" + 0.010*\"germani\" + 0.009*\"ship\" + 0.009*\"soviet\"'),\n", - " (48,\n", - " '0.174*\"art\" + 0.099*\"museum\" + 0.058*\"paint\" + 0.057*\"work\" + 0.044*\"artist\" + 0.041*\"galleri\" + 0.038*\"exhibit\" + 0.031*\"collect\" + 0.023*\"histori\" + 0.021*\"design\"'),\n", - " (49,\n", - " '0.067*\"peak\" + 0.066*\"kitt\" + 0.066*\"mount\" + 0.066*\"spacewatch\" + 0.065*\"lemmon\" + 0.033*\"survei\" + 0.026*\"octob\" + 0.024*\"septemb\" + 0.015*\"novemb\" + 0.012*\"march\"')]" - ] - }, - "execution_count": 16, - "metadata": {}, - "output_type": "execute_result" } ], "source": [ - "nmf_with_r = Nmf.load('nmf_with_r.model')\n", - "row.update(get_tm_metrics(nmf_with_r, test_corpus))\n", - "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)\n", - "\n", - "nmf_with_r.show_topics(50)" + "nmf = GensimNmf.load('gensim_nmf.model')\n", + "row.update(get_tm_metrics(nmf, test_corpus))\n", + "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)" ] }, { @@ -856,428 +908,22602 @@ "name": "stderr", "output_type": "stream", "text": [ - "2019-01-16 04:06:27,576 : INFO : using symmetric alpha at 0.02\n", - "2019-01-16 04:06:27,576 : INFO : using symmetric eta at 0.02\n", - "2019-01-16 04:06:27,589 : INFO : using serial LDA version on this node\n", - "2019-01-16 04:06:28,185 : INFO : running online (single-pass) LDA training, 50 topics, 1 passes over the supplied corpus of 4922894 documents, updating model once every 2000 documents, evaluating perplexity every 20000 documents, iterating 50x with a convergence threshold of 0.001000\n", - "2019-01-16 04:06:28,910 : INFO : PROGRESS: pass 0, at 
document #2000/4922894\n", - "==Truncated==\n", - "2019-01-16 06:24:26,456 : INFO : topic diff=0.003897, rho=0.020154\n", - "2019-01-16 06:24:26,465 : INFO : saving LdaState object under lda.model.state, separately None\n", - "2019-01-16 06:24:26,680 : INFO : saved lda.model.state\n", - "2019-01-16 06:24:26,732 : INFO : saving LdaModel object under lda.model, separately ['expElogbeta', 'sstats']\n", - "2019-01-16 06:24:26,732 : INFO : storing np array 'expElogbeta' to lda.model.expElogbeta.npy\n", - "2019-01-16 06:24:26,812 : INFO : not storing attribute dispatcher\n", - "2019-01-16 06:24:26,814 : INFO : not storing attribute id2word\n", - "2019-01-16 06:24:26,815 : INFO : not storing attribute state\n", - "2019-01-16 06:24:26,828 : INFO : saved lda.model\n" + "2019-01-31 00:15:00,190 : INFO : using symmetric alpha at 0.02\n", + "2019-01-31 00:15:00,192 : INFO : using symmetric eta at 0.02\n", + "2019-01-31 00:15:00,209 : INFO : using serial LDA version on this node\n", + "2019-01-31 00:15:00,734 : INFO : running online (single-pass) LDA training, 50 topics, 1 passes over the supplied corpus of 4922894 documents, updating model once every 2000 documents, evaluating perplexity every 20000 documents, iterating 50x with a convergence threshold of 0.001000\n", + "2019-01-31 00:15:00,890 : INFO : PROGRESS: pass 0, at document #2000/4922894\n", + "2019-01-31 00:15:02,814 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:03,134 : INFO : topic #36 (0.020): 0.006*\"new\" + 0.005*\"reconstruct\" + 0.004*\"serv\" + 0.004*\"includ\" + 0.003*\"yawn\" + 0.003*\"start\" + 0.003*\"depress\" + 0.003*\"word\" + 0.003*\"théori\" + 0.003*\"american\"\n", + "2019-01-31 00:15:03,136 : INFO : topic #19 (0.020): 0.005*\"taxpay\" + 0.005*\"new\" + 0.004*\"nation\" + 0.004*\"start\" + 0.004*\"includ\" + 0.003*\"théori\" + 0.003*\"apocrypha\" + 0.003*\"yawn\" + 0.002*\"unionist\" + 0.002*\"level\"\n", + "2019-01-31 00:15:03,138 : INFO : 
topic #42 (0.020): 0.004*\"new\" + 0.004*\"teufel\" + 0.004*\"yawn\" + 0.004*\"member\" + 0.003*\"théori\" + 0.003*\"start\" + 0.003*\"workplac\" + 0.003*\"unit\" + 0.003*\"word\" + 0.003*\"nation\"\n", + "2019-01-31 00:15:03,140 : INFO : topic #43 (0.020): 0.006*\"start\" + 0.005*\"yawn\" + 0.005*\"includ\" + 0.005*\"elect\" + 0.003*\"fusiform\" + 0.003*\"nation\" + 0.003*\"scholar\" + 0.003*\"new\" + 0.003*\"rivièr\" + 0.003*\"muscl\"\n", + "2019-01-31 00:15:03,142 : INFO : topic #5 (0.020): 0.010*\"abroad\" + 0.004*\"yawn\" + 0.004*\"new\" + 0.003*\"start\" + 0.003*\"bone\" + 0.003*\"reconstruct\" + 0.003*\"includ\" + 0.003*\"son\" + 0.003*\"rel\" + 0.003*\"charcoal\"\n", + "2019-01-31 00:15:03,150 : INFO : topic diff=40.889942, rho=1.000000\n", + "2019-01-31 00:15:03,325 : INFO : PROGRESS: pass 0, at document #4000/4922894\n", + "2019-01-31 00:15:05,268 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:05,527 : INFO : topic #1 (0.020): 0.007*\"yawn\" + 0.006*\"kosmo\" + 0.005*\"scholar\" + 0.004*\"cabinetmak\" + 0.004*\"taxpay\" + 0.004*\"nathali\" + 0.004*\"optimum\" + 0.004*\"start\" + 0.003*\"march\" + 0.003*\"soyuz\"\n", + "2019-01-31 00:15:05,528 : INFO : topic #33 (0.020): 0.004*\"levi\" + 0.004*\"wreath\" + 0.004*\"start\" + 0.004*\"anglo\" + 0.004*\"bourbon\" + 0.003*\"hofsted\" + 0.003*\"includ\" + 0.003*\"decatur\" + 0.003*\"hesit\" + 0.003*\"workplac\"\n", + "2019-01-31 00:15:05,529 : INFO : topic #15 (0.020): 0.008*\"leagu\" + 0.006*\"goal\" + 0.006*\"start\" + 0.006*\"taxpay\" + 0.006*\"econom\" + 0.004*\"theoret\" + 0.004*\"economi\" + 0.004*\"schuster\" + 0.004*\"develop\" + 0.004*\"resolut\"\n", + "2019-01-31 00:15:05,531 : INFO : topic #14 (0.020): 0.011*\"armi\" + 0.011*\"aggress\" + 0.008*\"airbu\" + 0.008*\"com\" + 0.007*\"forc\" + 0.007*\"unionist\" + 0.006*\"corp\" + 0.006*\"diversifi\" + 0.005*\"fiscal\" + 0.005*\"gener\"\n", + "2019-01-31 00:15:05,532 : INFO : topic #3 (0.020): 
0.007*\"start\" + 0.006*\"new\" + 0.005*\"american\" + 0.004*\"walter\" + 0.004*\"nation\" + 0.004*\"yawn\" + 0.004*\"gaa\" + 0.004*\"gener\" + 0.003*\"workplac\" + 0.003*\"diversifi\"\n", + "2019-01-31 00:15:05,537 : INFO : topic diff=0.441109, rho=0.707107\n", + "2019-01-31 00:15:05,696 : INFO : PROGRESS: pass 0, at document #6000/4922894\n", + "2019-01-31 00:15:07,514 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:07,769 : INFO : topic #1 (0.020): 0.007*\"yawn\" + 0.005*\"gabriela\" + 0.005*\"taxpay\" + 0.004*\"optimum\" + 0.004*\"cleveland\" + 0.004*\"kosmo\" + 0.004*\"scholar\" + 0.004*\"champion\" + 0.003*\"questionnair\" + 0.003*\"cabinetmak\"\n", + "2019-01-31 00:15:07,771 : INFO : topic #22 (0.020): 0.013*\"isl\" + 0.012*\"citi\" + 0.011*\"popolo\" + 0.011*\"spars\" + 0.010*\"adulthood\" + 0.010*\"factor\" + 0.008*\"hostil\" + 0.007*\"yawn\" + 0.007*\"area\" + 0.006*\"feel\"\n", + "2019-01-31 00:15:07,772 : INFO : topic #7 (0.020): 0.007*\"darwin\" + 0.006*\"hous\" + 0.005*\"yawn\" + 0.005*\"church\" + 0.005*\"john\" + 0.004*\"member\" + 0.004*\"dai\" + 0.004*\"kangaroo\" + 0.004*\"start\" + 0.004*\"new\"\n", + "2019-01-31 00:15:07,773 : INFO : topic #24 (0.020): 0.012*\"page\" + 0.011*\"do\" + 0.007*\"book\" + 0.006*\"languag\" + 0.006*\"new\" + 0.006*\"nicola\" + 0.005*\"ural\" + 0.005*\"american\" + 0.005*\"publicis\" + 0.004*\"storag\"\n", + "2019-01-31 00:15:07,774 : INFO : topic #4 (0.020): 0.009*\"enfranchis\" + 0.008*\"companhia\" + 0.007*\"new\" + 0.007*\"diagnost\" + 0.005*\"candid\" + 0.005*\"mandir\" + 0.005*\"depress\" + 0.005*\"frozen\" + 0.005*\"wheel\" + 0.005*\"oper\"\n", + "2019-01-31 00:15:07,780 : INFO : topic diff=0.324808, rho=0.577350\n", + "2019-01-31 00:15:07,940 : INFO : PROGRESS: pass 0, at document #8000/4922894\n", + "2019-01-31 00:15:09,689 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:09,949 : INFO : topic #49 
(0.020): 0.007*\"area\" + 0.007*\"line\" + 0.006*\"govern\" + 0.006*\"start\" + 0.006*\"warmth\" + 0.006*\"protect\" + 0.005*\"regim\" + 0.005*\"india\" + 0.005*\"statewid\" + 0.005*\"lobe\"\n", + "2019-01-31 00:15:09,950 : INFO : topic #0 (0.020): 0.023*\"statewid\" + 0.022*\"arsen\" + 0.009*\"raid\" + 0.008*\"pain\" + 0.008*\"line\" + 0.007*\"gai\" + 0.007*\"ret\" + 0.006*\"museo\" + 0.005*\"new\" + 0.005*\"centuri\"\n", + "2019-01-31 00:15:09,952 : INFO : topic #25 (0.020): 0.016*\"palmer\" + 0.011*\"mount\" + 0.007*\"mound\" + 0.006*\"includ\" + 0.006*\"spars\" + 0.005*\"area\" + 0.005*\"biom\" + 0.005*\"new\" + 0.004*\"rain\" + 0.004*\"arsen\"\n", + "2019-01-31 00:15:09,953 : INFO : topic #30 (0.020): 0.015*\"cleveland\" + 0.014*\"scientist\" + 0.013*\"leagu\" + 0.013*\"crete\" + 0.013*\"taxpay\" + 0.012*\"place\" + 0.011*\"final\" + 0.011*\"champion\" + 0.010*\"women\" + 0.008*\"rooftop\"\n", + "2019-01-31 00:15:09,954 : INFO : topic #24 (0.020): 0.014*\"book\" + 0.010*\"publicis\" + 0.009*\"page\" + 0.007*\"nicola\" + 0.007*\"languag\" + 0.006*\"new\" + 0.005*\"storag\" + 0.005*\"do\" + 0.005*\"american\" + 0.005*\"ural\"\n", + "2019-01-31 00:15:09,960 : INFO : topic diff=0.256670, rho=0.500000\n", + "2019-01-31 00:15:10,121 : INFO : PROGRESS: pass 0, at document #10000/4922894\n", + "2019-01-31 00:15:11,841 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:12,099 : INFO : topic #35 (0.020): 0.021*\"parti\" + 0.011*\"rural\" + 0.010*\"group\" + 0.010*\"voluntari\" + 0.010*\"elect\" + 0.008*\"district\" + 0.007*\"local\" + 0.007*\"govern\" + 0.006*\"moscow\" + 0.006*\"new\"\n", + "2019-01-31 00:15:12,101 : INFO : topic #24 (0.020): 0.024*\"book\" + 0.015*\"voic\" + 0.013*\"publicis\" + 0.009*\"page\" + 0.007*\"languag\" + 0.007*\"nicola\" + 0.007*\"new\" + 0.006*\"magazin\" + 0.006*\"word\" + 0.006*\"storag\"\n", + "2019-01-31 00:15:12,102 : INFO : topic #39 (0.020): 0.034*\"taxpay\" + 0.023*\"scientist\" + 
0.023*\"leagu\" + 0.021*\"clot\" + 0.015*\"place\" + 0.011*\"player\" + 0.010*\"folei\" + 0.009*\"hoar\" + 0.008*\"yawn\" + 0.007*\"fusiform\"\n", + "2019-01-31 00:15:12,104 : INFO : topic #38 (0.020): 0.011*\"aza\" + 0.011*\"teufel\" + 0.008*\"walter\" + 0.007*\"fit\" + 0.006*\"king\" + 0.006*\"deal\" + 0.006*\"start\" + 0.005*\"murder\" + 0.005*\"british\" + 0.005*\"book\"\n", + "2019-01-31 00:15:12,105 : INFO : topic #21 (0.020): 0.006*\"honeymoon\" + 0.006*\"spain\" + 0.006*\"samford\" + 0.005*\"mercier\" + 0.005*\"juan\" + 0.005*\"santa\" + 0.005*\"mexico\" + 0.005*\"rosa\" + 0.005*\"venezuela\" + 0.005*\"josé\"\n", + "2019-01-31 00:15:12,112 : INFO : topic diff=0.237227, rho=0.447214\n", + "2019-01-31 00:15:12,277 : INFO : PROGRESS: pass 0, at document #12000/4922894\n", + "2019-01-31 00:15:13,929 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:14,187 : INFO : topic #1 (0.020): 0.016*\"shu\" + 0.007*\"yawn\" + 0.005*\"argentina\" + 0.005*\"brigitt\" + 0.005*\"åsa\" + 0.004*\"cleveland\" + 0.004*\"taxpay\" + 0.004*\"pledg\" + 0.004*\"rancheria\" + 0.004*\"paraboloid\"\n", + "2019-01-31 00:15:14,189 : INFO : topic #20 (0.020): 0.053*\"scholar\" + 0.017*\"struggl\" + 0.015*\"educ\" + 0.011*\"prognosi\" + 0.010*\"high\" + 0.009*\"woman\" + 0.008*\"yawn\" + 0.007*\"intern\" + 0.006*\"new\" + 0.006*\"nation\"\n", + "2019-01-31 00:15:14,190 : INFO : topic #49 (0.020): 0.010*\"area\" + 0.007*\"line\" + 0.007*\"regim\" + 0.007*\"govern\" + 0.006*\"start\" + 0.006*\"khalsa\" + 0.005*\"india\" + 0.005*\"rosenwald\" + 0.005*\"near\" + 0.005*\"peopl\"\n", + "2019-01-31 00:15:14,192 : INFO : topic #23 (0.020): 0.060*\"audit\" + 0.032*\"best\" + 0.011*\"noll\" + 0.010*\"yawn\" + 0.006*\"michel\" + 0.004*\"muscl\" + 0.004*\"dai\" + 0.004*\"intern\" + 0.004*\"fewer\" + 0.004*\"women\"\n", + "2019-01-31 00:15:14,193 : INFO : topic #10 (0.020): 0.008*\"cdd\" + 0.008*\"fusiform\" + 0.007*\"pathwai\" + 0.006*\"cancer\" + 
0.006*\"disco\" + 0.006*\"effect\" + 0.005*\"includ\" + 0.005*\"gastrointestin\" + 0.004*\"théori\" + 0.004*\"uruguayan\"\n" ] - } - ], - "source": [ - "row = dict()\n", - "row['model'] = 'lda'\n", - "row['train_time'], lda = get_execution_time(\n", - " lambda: LdaModel(**params)\n", - ")\n", - "lda.save('lda.model')" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Load LDA and store metrics" - ] - }, - { - "cell_type": "code", - "execution_count": 18, - "metadata": {}, - "outputs": [ + }, { "name": "stderr", "output_type": "stream", "text": [ - "2019-01-16 06:24:27,064 : INFO : loading LdaModel object from lda.model\n", - "2019-01-16 06:24:27,070 : INFO : loading expElogbeta from lda.model.expElogbeta.npy with mmap=None\n", - "2019-01-16 06:24:27,077 : INFO : setting ignored attribute dispatcher to None\n", - "2019-01-16 06:24:27,078 : INFO : setting ignored attribute id2word to None\n", - "2019-01-16 06:24:27,078 : INFO : setting ignored attribute state to None\n", - "2019-01-16 06:24:27,079 : INFO : loaded lda.model\n", - "2019-01-16 06:24:27,079 : INFO : loading LdaState object from lda.model.state\n", - "2019-01-16 06:24:27,173 : INFO : loaded lda.model.state\n", - "2019-01-16 06:24:41,257 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", - "2019-01-16 06:24:41,452 : INFO : CorpusAccumulator accumulated stats from 2000 documents\n" + "2019-01-31 00:15:14,199 : INFO : topic diff=0.220294, rho=0.408248\n", + "2019-01-31 00:15:14,358 : INFO : PROGRESS: pass 0, at document #14000/4922894\n", + "2019-01-31 00:15:16,536 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:16,796 : INFO : topic #39 (0.020): 0.038*\"taxpay\" + 0.025*\"scientist\" + 0.025*\"clot\" + 0.020*\"leagu\" + 0.015*\"place\" + 0.012*\"player\" + 0.012*\"folei\" + 0.010*\"hoar\" + 0.009*\"yawn\" + 0.009*\"basketbal\"\n", + "2019-01-31 00:15:16,797 : INFO : topic #0 (0.020): 0.035*\"statewid\" + 
0.031*\"arsen\" + 0.015*\"line\" + 0.014*\"raid\" + 0.012*\"museo\" + 0.012*\"pain\" + 0.012*\"left\" + 0.011*\"alic\" + 0.010*\"word\" + 0.009*\"artist\"\n", + "2019-01-31 00:15:16,798 : INFO : topic #13 (0.020): 0.020*\"sourc\" + 0.018*\"north\" + 0.015*\"weekli\" + 0.013*\"earthworm\" + 0.012*\"castl\" + 0.012*\"lagrang\" + 0.010*\"cotton\" + 0.009*\"vigour\" + 0.008*\"vacant\" + 0.008*\"hormon\"\n", + "2019-01-31 00:15:16,800 : INFO : topic #45 (0.020): 0.015*\"depress\" + 0.007*\"slow\" + 0.006*\"stanc\" + 0.006*\"dendrit\" + 0.006*\"uruguayan\" + 0.005*\"light\" + 0.005*\"pour\" + 0.005*\"warmth\" + 0.004*\"color\" + 0.004*\"encyclopedia\"\n", + "2019-01-31 00:15:16,801 : INFO : topic #12 (0.020): 0.009*\"frontal\" + 0.008*\"number\" + 0.007*\"form\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"uruguayan\" + 0.005*\"exampl\" + 0.005*\"order\" + 0.005*\"differ\" + 0.005*\"théori\"\n", + "2019-01-31 00:15:16,807 : INFO : topic diff=0.214280, rho=0.377964\n", + "2019-01-31 00:15:16,962 : INFO : PROGRESS: pass 0, at document #16000/4922894\n", + "2019-01-31 00:15:18,538 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:18,797 : INFO : topic #13 (0.020): 0.021*\"sourc\" + 0.018*\"north\" + 0.015*\"earthworm\" + 0.015*\"weekli\" + 0.015*\"lagrang\" + 0.012*\"castl\" + 0.010*\"cotton\" + 0.009*\"hormon\" + 0.009*\"vigour\" + 0.008*\"vacant\"\n", + "2019-01-31 00:15:18,798 : INFO : topic #40 (0.020): 0.052*\"unit\" + 0.022*\"collector\" + 0.019*\"start\" + 0.010*\"new\" + 0.009*\"american\" + 0.009*\"scholar\" + 0.008*\"institut\" + 0.006*\"word\" + 0.006*\"terri\" + 0.006*\"governor\"\n", + "2019-01-31 00:15:18,799 : INFO : topic #45 (0.020): 0.019*\"depress\" + 0.008*\"cat\" + 0.007*\"light\" + 0.006*\"uruguayan\" + 0.005*\"pour\" + 0.005*\"cambridg\" + 0.005*\"hade\" + 0.005*\"warmth\" + 0.004*\"slow\" + 0.004*\"stanc\"\n", + "2019-01-31 00:15:18,800 : INFO : topic #33 (0.020): 0.011*\"wreath\" + 
0.010*\"french\" + 0.010*\"chemic\" + 0.007*\"lazi\" + 0.007*\"diphthong\" + 0.007*\"lebanon\" + 0.007*\"arbroath\" + 0.007*\"sauc\" + 0.006*\"mcdonald\" + 0.005*\"daphn\"\n", + "2019-01-31 00:15:18,801 : INFO : topic #19 (0.020): 0.009*\"pour\" + 0.006*\"anim\" + 0.006*\"uruguayan\" + 0.005*\"form\" + 0.005*\"charact\" + 0.005*\"bodi\" + 0.005*\"like\" + 0.004*\"person\" + 0.004*\"act\" + 0.004*\"origin\"\n", + "2019-01-31 00:15:18,807 : INFO : topic diff=0.231270, rho=0.353553\n", + "2019-01-31 00:15:18,964 : INFO : PROGRESS: pass 0, at document #18000/4922894\n", + "2019-01-31 00:15:20,562 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:20,821 : INFO : topic #36 (0.020): 0.024*\"elegan\" + 0.018*\"companhia\" + 0.010*\"serv\" + 0.008*\"manag\" + 0.007*\"market\" + 0.007*\"produc\" + 0.007*\"new\" + 0.007*\"oper\" + 0.006*\"network\" + 0.006*\"develop\"\n", + "2019-01-31 00:15:20,823 : INFO : topic #20 (0.020): 0.065*\"scholar\" + 0.020*\"struggl\" + 0.019*\"educ\" + 0.013*\"prognosi\" + 0.012*\"high\" + 0.010*\"yawn\" + 0.009*\"woman\" + 0.007*\"pseudo\" + 0.006*\"intern\" + 0.006*\"commun\"\n", + "2019-01-31 00:15:20,823 : INFO : topic #23 (0.020): 0.081*\"audit\" + 0.045*\"best\" + 0.018*\"noll\" + 0.015*\"yawn\" + 0.010*\"kri\" + 0.007*\"women\" + 0.007*\"tokyo\" + 0.006*\"winner\" + 0.006*\"prison\" + 0.006*\"dai\"\n", + "2019-01-31 00:15:20,825 : INFO : topic #21 (0.020): 0.015*\"spain\" + 0.015*\"samford\" + 0.013*\"mexico\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"del\" + 0.010*\"josé\" + 0.009*\"misconcept\" + 0.007*\"plung\" + 0.007*\"soviet\"\n", + "2019-01-31 00:15:20,826 : INFO : topic #40 (0.020): 0.051*\"unit\" + 0.022*\"collector\" + 0.018*\"start\" + 0.011*\"american\" + 0.010*\"new\" + 0.009*\"scholar\" + 0.008*\"institut\" + 0.007*\"word\" + 0.007*\"terri\" + 0.007*\"governor\"\n", + "2019-01-31 00:15:20,831 : INFO : topic diff=0.230670, rho=0.333333\n", + "2019-01-31 00:15:23,694 : 
INFO : -11.706 per-word bound, 3341.9 perplexity estimate based on a held-out corpus of 2000 documents with 557209 words\n", + "2019-01-31 00:15:23,694 : INFO : PROGRESS: pass 0, at document #20000/4922894\n", + "2019-01-31 00:15:25,238 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:25,498 : INFO : topic #41 (0.020): 0.020*\"new\" + 0.019*\"citi\" + 0.013*\"museo\" + 0.012*\"strategist\" + 0.011*\"year\" + 0.010*\"center\" + 0.009*\"festiv\" + 0.009*\"briarwood\" + 0.007*\"arsen\" + 0.007*\"hot\"\n", + "2019-01-31 00:15:25,499 : INFO : topic #42 (0.020): 0.012*\"german\" + 0.007*\"anglo\" + 0.006*\"germani\" + 0.006*\"europ\" + 0.006*\"histori\" + 0.006*\"vol\" + 0.006*\"polici\" + 0.005*\"der\" + 0.005*\"islam\" + 0.005*\"centuri\"\n", + "2019-01-31 00:15:25,500 : INFO : topic #13 (0.020): 0.021*\"sourc\" + 0.018*\"north\" + 0.016*\"weekli\" + 0.015*\"earthworm\" + 0.014*\"ireland\" + 0.013*\"neutral\" + 0.012*\"lagrang\" + 0.011*\"castl\" + 0.010*\"cotton\" + 0.009*\"wale\"\n", + "2019-01-31 00:15:25,502 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.024*\"player\" + 0.021*\"place\" + 0.013*\"scientist\" + 0.011*\"folei\" + 0.010*\"yard\" + 0.010*\"leagu\" + 0.010*\"taxpay\" + 0.009*\"yawn\" + 0.007*\"ruler\"\n", + "2019-01-31 00:15:25,503 : INFO : topic #1 (0.020): 0.008*\"brazil\" + 0.008*\"abreast\" + 0.008*\"argentina\" + 0.007*\"shu\" + 0.007*\"brazilian\" + 0.007*\"yawn\" + 0.007*\"min\" + 0.006*\"proton\" + 0.005*\"justinian\" + 0.005*\"hildesheim\"\n", + "2019-01-31 00:15:25,509 : INFO : topic diff=0.242050, rho=0.316228\n", + "2019-01-31 00:15:25,672 : INFO : PROGRESS: pass 0, at document #22000/4922894\n", + "2019-01-31 00:15:27,254 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:27,515 : INFO : topic #37 (0.020): 0.007*\"rel\" + 0.007*\"love\" + 0.006*\"théori\" + 0.006*\"place\" + 0.005*\"appear\" + 0.004*\"son\" + 0.004*\"night\" + 
0.003*\"man\" + 0.003*\"perceptu\" + 0.003*\"live\"\n", + "2019-01-31 00:15:27,516 : INFO : topic #45 (0.020): 0.016*\"depress\" + 0.011*\"light\" + 0.006*\"uruguayan\" + 0.006*\"warmth\" + 0.005*\"summer\" + 0.005*\"cat\" + 0.005*\"color\" + 0.004*\"cambridg\" + 0.004*\"black\" + 0.004*\"like\"\n", + "2019-01-31 00:15:27,518 : INFO : topic #1 (0.020): 0.010*\"min\" + 0.008*\"brazil\" + 0.007*\"hildesheim\" + 0.007*\"justinian\" + 0.006*\"brazilian\" + 0.006*\"argentina\" + 0.006*\"yawn\" + 0.006*\"abreast\" + 0.005*\"bernabéu\" + 0.005*\"leah\"\n", + "2019-01-31 00:15:27,518 : INFO : topic #28 (0.020): 0.020*\"rivièr\" + 0.016*\"ring\" + 0.016*\"build\" + 0.015*\"hous\" + 0.011*\"buford\" + 0.010*\"lobe\" + 0.009*\"histor\" + 0.009*\"area\" + 0.009*\"church\" + 0.009*\"tortur\"\n", + "2019-01-31 00:15:27,519 : INFO : topic #12 (0.020): 0.007*\"number\" + 0.007*\"frontal\" + 0.006*\"exampl\" + 0.006*\"differ\" + 0.006*\"method\" + 0.006*\"gener\" + 0.006*\"form\" + 0.006*\"uruguayan\" + 0.005*\"group\" + 0.005*\"superimpos\"\n", + "2019-01-31 00:15:27,525 : INFO : topic diff=0.259331, rho=0.301511\n", + "2019-01-31 00:15:27,684 : INFO : PROGRESS: pass 0, at document #24000/4922894\n", + "2019-01-31 00:15:29,222 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:29,482 : INFO : topic #7 (0.020): 0.019*\"locri\" + 0.013*\"sir\" + 0.013*\"church\" + 0.010*\"snatch\" + 0.008*\"john\" + 0.008*\"yawn\" + 0.008*\"factor\" + 0.008*\"di\" + 0.006*\"hous\" + 0.006*\"faster\"\n", + "2019-01-31 00:15:29,483 : INFO : topic #22 (0.020): 0.025*\"factor\" + 0.021*\"spars\" + 0.019*\"isl\" + 0.014*\"popolo\" + 0.013*\"adulthood\" + 0.010*\"feel\" + 0.009*\"male\" + 0.009*\"hostil\" + 0.009*\"area\" + 0.008*\"live\"\n", + "2019-01-31 00:15:29,484 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.022*\"candid\" + 0.016*\"veget\" + 0.013*\"mode\" + 0.011*\"elabor\" + 0.009*\"depress\" + 0.009*\"pour\" + 0.007*\"fuel\" + 
0.006*\"mandir\" + 0.006*\"companhia\"\n", + "2019-01-31 00:15:29,485 : INFO : topic #28 (0.020): 0.017*\"rivièr\" + 0.017*\"build\" + 0.015*\"hous\" + 0.015*\"ring\" + 0.012*\"buford\" + 0.011*\"area\" + 0.010*\"lobe\" + 0.010*\"tortur\" + 0.009*\"histor\" + 0.009*\"church\"\n", + "2019-01-31 00:15:29,486 : INFO : topic #14 (0.020): 0.021*\"armi\" + 0.017*\"forc\" + 0.016*\"walter\" + 0.013*\"aggress\" + 0.013*\"refut\" + 0.012*\"com\" + 0.011*\"unionist\" + 0.011*\"librari\" + 0.011*\"diversifi\" + 0.010*\"rotterdam\"\n", + "2019-01-31 00:15:29,492 : INFO : topic diff=0.261842, rho=0.288675\n" ] }, { - "data": { - "text/plain": [ - "[(0,\n", - " '0.033*\"war\" + 0.028*\"armi\" + 0.021*\"forc\" + 0.020*\"command\" + 0.015*\"militari\" + 0.015*\"battl\" + 0.013*\"gener\" + 0.012*\"offic\" + 0.011*\"divis\" + 0.011*\"regiment\"'),\n", - " (1,\n", - " '0.038*\"album\" + 0.028*\"song\" + 0.026*\"releas\" + 0.026*\"record\" + 0.021*\"band\" + 0.016*\"singl\" + 0.015*\"music\" + 0.014*\"chart\" + 0.013*\"track\" + 0.010*\"guitar\"'),\n", - " (2,\n", - " '0.062*\"german\" + 0.039*\"germani\" + 0.025*\"van\" + 0.023*\"von\" + 0.020*\"der\" + 0.019*\"dutch\" + 0.019*\"berlin\" + 0.015*\"swedish\" + 0.014*\"netherland\" + 0.014*\"sweden\"'),\n", - " (3,\n", - " '0.032*\"john\" + 0.027*\"william\" + 0.019*\"british\" + 0.015*\"georg\" + 0.015*\"london\" + 0.014*\"thoma\" + 0.014*\"sir\" + 0.014*\"jame\" + 0.013*\"royal\" + 0.013*\"henri\"'),\n", - " (4,\n", - " '0.137*\"school\" + 0.040*\"colleg\" + 0.039*\"student\" + 0.033*\"univers\" + 0.030*\"high\" + 0.028*\"educ\" + 0.016*\"year\" + 0.011*\"graduat\" + 0.010*\"state\" + 0.009*\"campu\"'),\n", - " (5,\n", - " '0.030*\"game\" + 0.009*\"develop\" + 0.009*\"player\" + 0.008*\"releas\" + 0.008*\"us\" + 0.008*\"softwar\" + 0.008*\"version\" + 0.008*\"user\" + 0.007*\"data\" + 0.007*\"includ\"'),\n", - " (6,\n", - " '0.061*\"music\" + 0.030*\"perform\" + 0.019*\"theatr\" + 0.018*\"compos\" + 0.016*\"plai\" + 0.016*\"festiv\" 
+ 0.015*\"danc\" + 0.014*\"orchestra\" + 0.012*\"opera\" + 0.011*\"piano\"'),\n", - " (7,\n", - " '0.013*\"number\" + 0.011*\"function\" + 0.010*\"model\" + 0.009*\"valu\" + 0.008*\"set\" + 0.008*\"exampl\" + 0.007*\"gener\" + 0.007*\"theori\" + 0.007*\"point\" + 0.006*\"method\"'),\n", - " (8,\n", - " '0.048*\"india\" + 0.037*\"indian\" + 0.020*\"http\" + 0.016*\"www\" + 0.015*\"pakistan\" + 0.015*\"iran\" + 0.013*\"sri\" + 0.012*\"khan\" + 0.012*\"islam\" + 0.012*\"tamil\"'),\n", - " (9,\n", - " '0.067*\"film\" + 0.025*\"award\" + 0.022*\"seri\" + 0.021*\"episod\" + 0.021*\"best\" + 0.015*\"star\" + 0.012*\"role\" + 0.012*\"actor\" + 0.011*\"televis\" + 0.011*\"produc\"'),\n", - " (10,\n", - " '0.020*\"engin\" + 0.013*\"power\" + 0.011*\"product\" + 0.011*\"design\" + 0.010*\"model\" + 0.009*\"produc\" + 0.008*\"us\" + 0.008*\"electr\" + 0.008*\"type\" + 0.007*\"vehicl\"'),\n", - " (11,\n", - " '0.024*\"law\" + 0.021*\"court\" + 0.016*\"state\" + 0.016*\"act\" + 0.011*\"polic\" + 0.010*\"case\" + 0.009*\"offic\" + 0.009*\"report\" + 0.009*\"right\" + 0.007*\"legal\"'),\n", - " (12,\n", - " '0.056*\"elect\" + 0.041*\"parti\" + 0.023*\"member\" + 0.020*\"vote\" + 0.020*\"presid\" + 0.017*\"democrat\" + 0.017*\"minist\" + 0.013*\"council\" + 0.013*\"repres\" + 0.012*\"polit\"'),\n", - " (13,\n", - " '0.057*\"state\" + 0.035*\"new\" + 0.029*\"american\" + 0.024*\"unit\" + 0.024*\"york\" + 0.020*\"counti\" + 0.015*\"citi\" + 0.014*\"california\" + 0.012*\"washington\" + 0.010*\"texa\"'),\n", - " (14,\n", - " '0.027*\"univers\" + 0.015*\"research\" + 0.014*\"institut\" + 0.012*\"nation\" + 0.012*\"scienc\" + 0.012*\"work\" + 0.012*\"intern\" + 0.011*\"award\" + 0.011*\"develop\" + 0.010*\"organ\"'),\n", - " (15,\n", - " '0.034*\"england\" + 0.024*\"unit\" + 0.021*\"london\" + 0.019*\"cricket\" + 0.019*\"town\" + 0.016*\"citi\" + 0.015*\"scotland\" + 0.013*\"manchest\" + 0.013*\"west\" + 0.012*\"scottish\"'),\n", - " (16,\n", - " '0.031*\"church\" + 0.017*\"famili\" + 
0.017*\"di\" + 0.016*\"son\" + 0.015*\"marri\" + 0.014*\"year\" + 0.013*\"father\" + 0.013*\"life\" + 0.013*\"born\" + 0.012*\"daughter\"'),\n", - " (17,\n", - " '0.060*\"race\" + 0.020*\"car\" + 0.017*\"team\" + 0.012*\"finish\" + 0.012*\"tour\" + 0.012*\"driver\" + 0.011*\"ford\" + 0.011*\"time\" + 0.011*\"championship\" + 0.011*\"year\"'),\n", - " (18,\n", - " '0.010*\"water\" + 0.007*\"light\" + 0.007*\"energi\" + 0.007*\"high\" + 0.006*\"surfac\" + 0.006*\"earth\" + 0.006*\"time\" + 0.005*\"effect\" + 0.005*\"temperatur\" + 0.005*\"materi\"'),\n", - " (19,\n", - " '0.022*\"radio\" + 0.020*\"new\" + 0.019*\"broadcast\" + 0.018*\"station\" + 0.014*\"televis\" + 0.013*\"channel\" + 0.013*\"dai\" + 0.011*\"program\" + 0.011*\"host\" + 0.011*\"air\"'),\n", - " (20,\n", - " '0.035*\"win\" + 0.018*\"contest\" + 0.017*\"wrestl\" + 0.017*\"fight\" + 0.016*\"match\" + 0.016*\"titl\" + 0.015*\"championship\" + 0.014*\"team\" + 0.012*\"world\" + 0.011*\"defeat\"'),\n", - " (21,\n", - " '0.011*\"languag\" + 0.007*\"word\" + 0.007*\"form\" + 0.006*\"peopl\" + 0.006*\"differ\" + 0.006*\"cultur\" + 0.006*\"us\" + 0.006*\"mean\" + 0.005*\"tradit\" + 0.005*\"term\"'),\n", - " (22,\n", - " '0.051*\"popul\" + 0.033*\"ag\" + 0.030*\"citi\" + 0.029*\"town\" + 0.027*\"famili\" + 0.026*\"censu\" + 0.023*\"household\" + 0.023*\"commun\" + 0.021*\"peopl\" + 0.021*\"counti\"'),\n", - " (23,\n", - " '0.016*\"medic\" + 0.014*\"health\" + 0.014*\"hospit\" + 0.013*\"cell\" + 0.011*\"diseas\" + 0.010*\"patient\" + 0.009*\"ret\" + 0.009*\"caus\" + 0.008*\"human\" + 0.008*\"treatment\"'),\n", - " (24,\n", - " '0.037*\"ship\" + 0.017*\"navi\" + 0.015*\"sea\" + 0.012*\"island\" + 0.012*\"boat\" + 0.011*\"port\" + 0.010*\"naval\" + 0.010*\"coast\" + 0.010*\"gun\" + 0.009*\"fleet\"'),\n", - " (25,\n", - " '0.044*\"round\" + 0.044*\"final\" + 0.025*\"tournament\" + 0.023*\"group\" + 0.020*\"point\" + 0.020*\"winner\" + 0.018*\"open\" + 0.015*\"place\" + 0.013*\"qualifi\" + 0.012*\"won\"'),\n", - " 
(26,\n", - " '0.032*\"world\" + 0.030*\"women\" + 0.028*\"championship\" + 0.026*\"olymp\" + 0.023*\"men\" + 0.022*\"event\" + 0.022*\"medal\" + 0.018*\"athlet\" + 0.017*\"gold\" + 0.017*\"nation\"'),\n", - " (27,\n", - " '0.056*\"born\" + 0.034*\"russian\" + 0.026*\"american\" + 0.020*\"russia\" + 0.020*\"soviet\" + 0.017*\"polish\" + 0.015*\"jewish\" + 0.014*\"poland\" + 0.014*\"republ\" + 0.013*\"moscow\"'),\n", - " (28,\n", - " '0.029*\"build\" + 0.025*\"hous\" + 0.014*\"built\" + 0.012*\"locat\" + 0.012*\"street\" + 0.012*\"site\" + 0.011*\"histor\" + 0.009*\"park\" + 0.009*\"citi\" + 0.009*\"place\"'),\n", - " (29,\n", - " '0.039*\"leagu\" + 0.036*\"club\" + 0.035*\"plai\" + 0.031*\"team\" + 0.026*\"footbal\" + 0.026*\"season\" + 0.023*\"cup\" + 0.018*\"goal\" + 0.016*\"player\" + 0.016*\"match\"'),\n", - " (30,\n", - " '0.053*\"french\" + 0.041*\"franc\" + 0.027*\"italian\" + 0.025*\"pari\" + 0.022*\"saint\" + 0.020*\"itali\" + 0.018*\"jean\" + 0.014*\"de\" + 0.011*\"loui\" + 0.011*\"le\"'),\n", - " (31,\n", - " '0.067*\"australia\" + 0.058*\"australian\" + 0.051*\"new\" + 0.040*\"china\" + 0.033*\"zealand\" + 0.032*\"south\" + 0.027*\"chines\" + 0.021*\"sydnei\" + 0.015*\"melbourn\" + 0.013*\"queensland\"'),\n", - " (32,\n", - " '0.026*\"speci\" + 0.011*\"famili\" + 0.009*\"plant\" + 0.008*\"white\" + 0.008*\"bird\" + 0.007*\"genu\" + 0.007*\"red\" + 0.007*\"forest\" + 0.007*\"fish\" + 0.006*\"tree\"'),\n", - " (33,\n", - " '0.033*\"compani\" + 0.013*\"million\" + 0.012*\"busi\" + 0.012*\"market\" + 0.011*\"product\" + 0.010*\"bank\" + 0.010*\"year\" + 0.009*\"industri\" + 0.008*\"oper\" + 0.008*\"new\"'),\n", - " (34,\n", - " '0.085*\"island\" + 0.073*\"canada\" + 0.065*\"canadian\" + 0.026*\"toronto\" + 0.025*\"ontario\" + 0.017*\"korean\" + 0.017*\"korea\" + 0.016*\"quebec\" + 0.016*\"montreal\" + 0.016*\"british\"'),\n", - " (35,\n", - " '0.034*\"kong\" + 0.034*\"japanes\" + 0.033*\"hong\" + 0.023*\"lee\" + 0.021*\"singapor\" + 0.019*\"chines\" + 
0.018*\"kim\" + 0.015*\"japan\" + 0.014*\"indonesia\" + 0.014*\"thailand\"'),\n", - " (36,\n", - " '0.054*\"art\" + 0.034*\"museum\" + 0.030*\"jpg\" + 0.027*\"file\" + 0.024*\"work\" + 0.022*\"paint\" + 0.020*\"artist\" + 0.019*\"design\" + 0.017*\"imag\" + 0.017*\"exhibit\"'),\n", - " (37,\n", - " '0.008*\"time\" + 0.007*\"man\" + 0.005*\"later\" + 0.005*\"appear\" + 0.005*\"charact\" + 0.005*\"kill\" + 0.004*\"like\" + 0.004*\"friend\" + 0.004*\"return\" + 0.004*\"end\"'),\n", - " (38,\n", - " '0.014*\"govern\" + 0.012*\"state\" + 0.012*\"nation\" + 0.010*\"war\" + 0.009*\"polit\" + 0.008*\"countri\" + 0.008*\"peopl\" + 0.007*\"group\" + 0.007*\"unit\" + 0.007*\"support\"'),\n", - " (39,\n", - " '0.050*\"air\" + 0.026*\"aircraft\" + 0.026*\"oper\" + 0.025*\"airport\" + 0.017*\"forc\" + 0.017*\"flight\" + 0.015*\"squadron\" + 0.014*\"unit\" + 0.012*\"base\" + 0.011*\"wing\"'),\n", - " (40,\n", - " '0.052*\"bar\" + 0.038*\"africa\" + 0.033*\"text\" + 0.033*\"african\" + 0.031*\"till\" + 0.029*\"color\" + 0.026*\"south\" + 0.023*\"black\" + 0.013*\"tropic\" + 0.013*\"storm\"'),\n", - " (41,\n", - " '0.039*\"book\" + 0.033*\"publish\" + 0.021*\"work\" + 0.015*\"new\" + 0.013*\"press\" + 0.013*\"univers\" + 0.013*\"edit\" + 0.011*\"stori\" + 0.011*\"novel\" + 0.011*\"author\"'),\n", - " (42,\n", - " '0.026*\"king\" + 0.019*\"centuri\" + 0.010*\"princ\" + 0.009*\"empir\" + 0.009*\"kingdom\" + 0.009*\"emperor\" + 0.009*\"greek\" + 0.008*\"roman\" + 0.007*\"ancient\" + 0.006*\"year\"'),\n", - " (43,\n", - " '0.033*\"san\" + 0.022*\"spanish\" + 0.017*\"mexico\" + 0.016*\"del\" + 0.013*\"spain\" + 0.012*\"santa\" + 0.011*\"brazil\" + 0.011*\"juan\" + 0.010*\"josé\" + 0.009*\"francisco\"'),\n", - " (44,\n", - " '0.029*\"game\" + 0.027*\"season\" + 0.023*\"team\" + 0.015*\"plai\" + 0.014*\"coach\" + 0.014*\"player\" + 0.011*\"footbal\" + 0.010*\"year\" + 0.010*\"leagu\" + 0.009*\"record\"'),\n", - " (45,\n", - " '0.015*\"john\" + 0.011*\"david\" + 0.010*\"michael\" + 
0.008*\"paul\" + 0.008*\"smith\" + 0.007*\"robert\" + 0.007*\"jame\" + 0.006*\"peter\" + 0.006*\"jack\" + 0.006*\"jone\"'),\n", - " (46,\n", - " '0.133*\"class\" + 0.062*\"align\" + 0.060*\"left\" + 0.056*\"wikit\" + 0.046*\"style\" + 0.043*\"center\" + 0.035*\"right\" + 0.032*\"philippin\" + 0.032*\"list\" + 0.026*\"text\"'),\n", - " (47,\n", - " '0.025*\"river\" + 0.024*\"station\" + 0.021*\"line\" + 0.020*\"road\" + 0.017*\"railwai\" + 0.015*\"rout\" + 0.013*\"lake\" + 0.012*\"park\" + 0.011*\"bridg\" + 0.011*\"area\"'),\n", - " (48,\n", - " '0.072*\"octob\" + 0.070*\"septemb\" + 0.069*\"march\" + 0.062*\"decemb\" + 0.062*\"januari\" + 0.062*\"novemb\" + 0.061*\"juli\" + 0.061*\"august\" + 0.060*\"april\" + 0.058*\"june\"'),\n", - " (49,\n", - " '0.093*\"district\" + 0.066*\"villag\" + 0.047*\"region\" + 0.039*\"east\" + 0.039*\"west\" + 0.038*\"north\" + 0.036*\"counti\" + 0.033*\"south\" + 0.032*\"municip\" + 0.029*\"provinc\"')]" - ] - }, - "execution_count": 18, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "lda = LdaModel.load('lda.model')\n", - "row.update(get_tm_metrics(lda, test_corpus))\n", - "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)\n", - "\n", - "lda.show_topics(50)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Results" - ] - }, - { - "cell_type": "code", - "execution_count": 19, - "metadata": {}, - "outputs": [ + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:15:29,649 : INFO : PROGRESS: pass 0, at document #26000/4922894\n", + "2019-01-31 00:15:31,187 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:31,448 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"disco\" + 0.007*\"cancer\" + 0.007*\"gastrointestin\" + 0.007*\"acid\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.005*\"includ\"\n", + "2019-01-31 00:15:31,449 : INFO : topic #18 (0.020): 
0.007*\"man\" + 0.006*\"kill\" + 0.005*\"charact\" + 0.005*\"théori\" + 0.004*\"septemb\" + 0.004*\"later\" + 0.004*\"appear\" + 0.004*\"epiru\" + 0.004*\"storag\" + 0.004*\"faster\"\n", + "2019-01-31 00:15:31,450 : INFO : topic #0 (0.020): 0.055*\"statewid\" + 0.038*\"arsen\" + 0.024*\"line\" + 0.024*\"raid\" + 0.016*\"pain\" + 0.016*\"word\" + 0.013*\"alic\" + 0.012*\"traceabl\" + 0.012*\"museo\" + 0.012*\"london\"\n", + "2019-01-31 00:15:31,451 : INFO : topic #37 (0.020): 0.007*\"love\" + 0.007*\"théori\" + 0.006*\"place\" + 0.006*\"rel\" + 0.005*\"appear\" + 0.005*\"night\" + 0.004*\"man\" + 0.004*\"son\" + 0.003*\"gestur\" + 0.003*\"yawn\"\n", + "2019-01-31 00:15:31,453 : INFO : topic #35 (0.020): 0.022*\"russia\" + 0.020*\"rural\" + 0.018*\"parti\" + 0.017*\"personifi\" + 0.013*\"unfortun\" + 0.013*\"moscow\" + 0.013*\"china\" + 0.011*\"sovereignti\" + 0.011*\"govern\" + 0.011*\"chilton\"\n", + "2019-01-31 00:15:31,459 : INFO : topic diff=0.267734, rho=0.277350\n", + "2019-01-31 00:15:31,610 : INFO : PROGRESS: pass 0, at document #28000/4922894\n", + "2019-01-31 00:15:33,125 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:33,387 : INFO : topic #9 (0.020): 0.058*\"bone\" + 0.021*\"muscl\" + 0.013*\"korea\" + 0.013*\"olympo\" + 0.012*\"compos\" + 0.012*\"simpler\" + 0.011*\"korean\" + 0.009*\"perceptu\" + 0.006*\"musician\" + 0.006*\"american\"\n", + "2019-01-31 00:15:33,388 : INFO : topic #29 (0.020): 0.017*\"govern\" + 0.010*\"work\" + 0.008*\"replac\" + 0.007*\"nation\" + 0.007*\"start\" + 0.006*\"pseudo\" + 0.006*\"yawn\" + 0.006*\"countri\" + 0.005*\"unfortun\" + 0.005*\"law\"\n", + "2019-01-31 00:15:33,389 : INFO : topic #16 (0.020): 0.017*\"rotterdam\" + 0.014*\"sino\" + 0.013*\"margin\" + 0.013*\"london\" + 0.012*\"priest\" + 0.011*\"quarterli\" + 0.011*\"daughter\" + 0.009*\"di\" + 0.009*\"locri\" + 0.008*\"snatch\"\n", + "2019-01-31 00:15:33,390 : INFO : topic #22 (0.020): 0.024*\"spars\" + 
0.023*\"factor\" + 0.015*\"isl\" + 0.014*\"popolo\" + 0.012*\"adulthood\" + 0.011*\"feel\" + 0.010*\"male\" + 0.009*\"hostil\" + 0.009*\"genu\" + 0.008*\"live\"\n", + "2019-01-31 00:15:33,392 : INFO : topic #45 (0.020): 0.013*\"depress\" + 0.010*\"light\" + 0.008*\"black\" + 0.006*\"blind\" + 0.006*\"colder\" + 0.005*\"record\" + 0.005*\"weapon\" + 0.005*\"summer\" + 0.005*\"cat\" + 0.005*\"like\"\n", + "2019-01-31 00:15:33,398 : INFO : topic diff=0.277764, rho=0.267261\n", + "2019-01-31 00:15:33,554 : INFO : PROGRESS: pass 0, at document #30000/4922894\n", + "2019-01-31 00:15:35,091 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:35,353 : INFO : topic #14 (0.020): 0.036*\"armi\" + 0.029*\"rotterdam\" + 0.027*\"corp\" + 0.022*\"refut\" + 0.019*\"serv\" + 0.015*\"forc\" + 0.015*\"apc\" + 0.015*\"walter\" + 0.014*\"leonida\" + 0.014*\"aggress\"\n", + "2019-01-31 00:15:35,354 : INFO : topic #33 (0.020): 0.035*\"french\" + 0.018*\"daphn\" + 0.017*\"jean\" + 0.015*\"franc\" + 0.015*\"sail\" + 0.013*\"lazi\" + 0.013*\"pari\" + 0.012*\"dish\" + 0.009*\"quebec\" + 0.008*\"piec\"\n", + "2019-01-31 00:15:35,355 : INFO : topic #13 (0.020): 0.033*\"sourc\" + 0.021*\"rotterdam\" + 0.020*\"north\" + 0.020*\"weekli\" + 0.016*\"earthworm\" + 0.015*\"ireland\" + 0.011*\"england\" + 0.011*\"ipa\" + 0.011*\"hormon\" + 0.010*\"parish\"\n", + "2019-01-31 00:15:35,356 : INFO : topic #10 (0.020): 0.009*\"cdd\" + 0.009*\"disco\" + 0.007*\"cancer\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"acid\" + 0.006*\"proper\" + 0.006*\"gastrointestin\" + 0.006*\"student\" + 0.005*\"includ\"\n", + "2019-01-31 00:15:35,357 : INFO : topic #23 (0.020): 0.107*\"audit\" + 0.059*\"best\" + 0.018*\"noll\" + 0.017*\"yawn\" + 0.013*\"jacksonvil\" + 0.011*\"women\" + 0.009*\"prison\" + 0.008*\"tokyo\" + 0.008*\"ur\" + 0.008*\"intern\"\n", + "2019-01-31 00:15:35,363 : INFO : topic diff=0.287250, rho=0.258199\n", + "2019-01-31 00:15:35,588 : INFO : 
PROGRESS: pass 0, at document #32000/4922894\n", + "2019-01-31 00:15:37,112 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:37,374 : INFO : topic #3 (0.020): 0.020*\"present\" + 0.018*\"american\" + 0.015*\"seri\" + 0.015*\"offic\" + 0.015*\"bone\" + 0.014*\"minist\" + 0.013*\"start\" + 0.013*\"appeas\" + 0.011*\"secess\" + 0.011*\"chickasaw\"\n", + "2019-01-31 00:15:37,376 : INFO : topic #24 (0.020): 0.030*\"book\" + 0.029*\"publicis\" + 0.014*\"word\" + 0.012*\"languag\" + 0.010*\"new\" + 0.010*\"edit\" + 0.010*\"nicola\" + 0.009*\"worldwid\" + 0.009*\"storag\" + 0.009*\"magazin\"\n", + "2019-01-31 00:15:37,377 : INFO : topic #43 (0.020): 0.050*\"elect\" + 0.045*\"parti\" + 0.019*\"voluntari\" + 0.018*\"democrat\" + 0.017*\"tendenc\" + 0.016*\"member\" + 0.015*\"republ\" + 0.013*\"polici\" + 0.013*\"start\" + 0.013*\"selma\"\n", + "2019-01-31 00:15:37,378 : INFO : topic #28 (0.020): 0.022*\"rivièr\" + 0.018*\"build\" + 0.015*\"hous\" + 0.012*\"buford\" + 0.012*\"ring\" + 0.011*\"lobe\" + 0.011*\"rosenwald\" + 0.010*\"area\" + 0.010*\"tortur\" + 0.009*\"histor\"\n", + "2019-01-31 00:15:37,379 : INFO : topic #48 (0.020): 0.065*\"januari\" + 0.061*\"octob\" + 0.060*\"march\" + 0.058*\"sens\" + 0.054*\"notion\" + 0.052*\"april\" + 0.052*\"juli\" + 0.052*\"judici\" + 0.049*\"august\" + 0.049*\"februari\"\n", + "2019-01-31 00:15:37,385 : INFO : topic diff=0.292880, rho=0.250000\n", + "2019-01-31 00:15:37,539 : INFO : PROGRESS: pass 0, at document #34000/4922894\n", + "2019-01-31 00:15:39,061 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:39,323 : INFO : topic #32 (0.020): 0.079*\"district\" + 0.066*\"vigour\" + 0.047*\"popolo\" + 0.033*\"multitud\" + 0.028*\"prosper\" + 0.026*\"regim\" + 0.022*\"cotton\" + 0.018*\"tortur\" + 0.018*\"cede\" + 0.016*\"ruptur\"\n", + "2019-01-31 00:15:39,324 : INFO : topic #35 (0.020): 0.024*\"russia\" + 0.023*\"chilton\" + 
0.021*\"china\" + 0.020*\"personifi\" + 0.016*\"rural\" + 0.015*\"sovereignti\" + 0.013*\"parti\" + 0.013*\"moscow\" + 0.012*\"communist\" + 0.011*\"unfortun\"\n", + "2019-01-31 00:15:39,326 : INFO : topic #43 (0.020): 0.052*\"elect\" + 0.046*\"parti\" + 0.020*\"voluntari\" + 0.018*\"democrat\" + 0.016*\"member\" + 0.015*\"tendenc\" + 0.014*\"republ\" + 0.013*\"polici\" + 0.013*\"selma\" + 0.013*\"start\"\n", + "2019-01-31 00:15:39,327 : INFO : topic #26 (0.020): 0.031*\"olymp\" + 0.028*\"workplac\" + 0.026*\"men\" + 0.023*\"event\" + 0.023*\"medal\" + 0.023*\"champion\" + 0.018*\"atheist\" + 0.017*\"woman\" + 0.016*\"gold\" + 0.015*\"théori\"\n", + "2019-01-31 00:15:39,328 : INFO : topic #22 (0.020): 0.028*\"spars\" + 0.021*\"factor\" + 0.017*\"isl\" + 0.015*\"adulthood\" + 0.014*\"popolo\" + 0.011*\"hostil\" + 0.011*\"feel\" + 0.010*\"live\" + 0.009*\"yawn\" + 0.009*\"male\"\n", + "2019-01-31 00:15:39,334 : INFO : topic diff=0.286981, rho=0.242536\n", + "2019-01-31 00:15:39,493 : INFO : PROGRESS: pass 0, at document #36000/4922894\n", + "2019-01-31 00:15:41,070 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:41,333 : INFO : topic #32 (0.020): 0.079*\"district\" + 0.061*\"vigour\" + 0.050*\"popolo\" + 0.032*\"multitud\" + 0.026*\"regim\" + 0.026*\"prosper\" + 0.022*\"cotton\" + 0.019*\"tortur\" + 0.019*\"cede\" + 0.016*\"ruptur\"\n", + "2019-01-31 00:15:41,334 : INFO : topic #7 (0.020): 0.016*\"locri\" + 0.015*\"church\" + 0.014*\"snatch\" + 0.011*\"sir\" + 0.011*\"di\" + 0.010*\"factor\" + 0.010*\"john\" + 0.009*\"yawn\" + 0.008*\"hous\" + 0.007*\"faster\"\n", + "2019-01-31 00:15:41,335 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.020*\"candid\" + 0.015*\"mode\" + 0.012*\"veget\" + 0.011*\"pour\" + 0.010*\"elabor\" + 0.010*\"depress\" + 0.009*\"mandir\" + 0.008*\"fuel\" + 0.008*\"produc\"\n", + "2019-01-31 00:15:41,336 : INFO : topic #17 (0.020): 0.030*\"church\" + 0.019*\"sail\" + 0.018*\"fifteenth\" 
+ 0.018*\"bishop\" + 0.017*\"centuri\" + 0.016*\"retroflex\" + 0.013*\"toluen\" + 0.012*\"jpg\" + 0.011*\"italian\" + 0.011*\"cathol\"\n", + "2019-01-31 00:15:41,337 : INFO : topic #12 (0.020): 0.007*\"gener\" + 0.007*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.005*\"uruguayan\" + 0.005*\"measur\" + 0.005*\"differ\" + 0.005*\"pro\" + 0.005*\"servitud\"\n", + "2019-01-31 00:15:41,343 : INFO : topic diff=0.292892, rho=0.235702\n", + "2019-01-31 00:15:41,510 : INFO : PROGRESS: pass 0, at document #38000/4922894\n", + "2019-01-31 00:15:43,031 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:43,295 : INFO : topic #34 (0.020): 0.068*\"cotton\" + 0.033*\"start\" + 0.020*\"toni\" + 0.017*\"violent\" + 0.014*\"california\" + 0.011*\"carefulli\" + 0.010*\"unionist\" + 0.010*\"terri\" + 0.010*\"citi\" + 0.009*\"obes\"\n" + ] + }, { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
coherencel2_normmodelperplexitytopicstrain_time
0-2.8141357.265412nmf975.740399[(24, 0.131*\"mount\" + 0.129*\"lemmon\" + 0.129*\"...4394.560518
1-2.4366507.268837nmf_with_r985.570926[(49, 0.112*\"peak\" + 0.111*\"kitt\" + 0.111*\"mou...26451.927848
2-2.5144697.371544lda4727.075546[(35, 0.034*\"kong\" + 0.034*\"japanes\" + 0.033*\"...8278.891060
\n", - "
" - ], - "text/plain": [ - " coherence l2_norm model perplexity \\\n", - "0 -2.814135 7.265412 nmf 975.740399 \n", - "1 -2.436650 7.268837 nmf_with_r 985.570926 \n", - "2 -2.514469 7.371544 lda 4727.075546 \n", - "\n", - " topics train_time \n", - "0 [(24, 0.131*\"mount\" + 0.129*\"lemmon\" + 0.129*\"... 4394.560518 \n", - "1 [(49, 0.112*\"peak\" + 0.111*\"kitt\" + 0.111*\"mou... 26451.927848 \n", - "2 [(35, 0.034*\"kong\" + 0.034*\"japanes\" + 0.033*\"... 8278.891060 " - ] - }, - "execution_count": 19, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "tm_metrics" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### RAM Usage:\n", - "- nmf: 100-150Mb\n", - "- nmf_with_r: 3-9Gb\n", - "- lda: 100Mb" - ] - }, - { - "cell_type": "code", - "execution_count": 20, - "metadata": {}, - "outputs": [ + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:15:43,296 : INFO : topic #40 (0.020): 0.072*\"unit\" + 0.025*\"collector\" + 0.015*\"start\" + 0.014*\"american\" + 0.011*\"new\" + 0.011*\"institut\" + 0.009*\"scholar\" + 0.009*\"word\" + 0.009*\"governor\" + 0.008*\"professor\"\n", + "2019-01-31 00:15:43,297 : INFO : topic #25 (0.020): 0.016*\"mount\" + 0.015*\"ring\" + 0.015*\"palmer\" + 0.014*\"lagrang\" + 0.013*\"mound\" + 0.011*\"area\" + 0.008*\"pcb\" + 0.007*\"robespierr\" + 0.006*\"natur\" + 0.006*\"surrend\"\n", + "2019-01-31 00:15:43,299 : INFO : topic #27 (0.020): 0.045*\"questionnair\" + 0.015*\"dai\" + 0.012*\"taxpay\" + 0.012*\"tornado\" + 0.012*\"théori\" + 0.010*\"rick\" + 0.010*\"horac\" + 0.010*\"squatter\" + 0.010*\"find\" + 0.009*\"sebastien\"\n", + "2019-01-31 00:15:43,301 : INFO : topic #48 (0.020): 0.066*\"octob\" + 0.062*\"januari\" + 0.061*\"march\" + 0.057*\"sens\" + 0.055*\"notion\" + 0.053*\"judici\" + 0.053*\"april\" + 0.052*\"juli\" + 0.051*\"august\" + 0.051*\"decatur\"\n", + "2019-01-31 00:15:43,307 : INFO : topic diff=0.286263, rho=0.229416\n", + "2019-01-31 
00:15:46,145 : INFO : -11.672 per-word bound, 3262.6 perplexity estimate based on a held-out corpus of 2000 documents with 564313 words\n", + "2019-01-31 00:15:46,146 : INFO : PROGRESS: pass 0, at document #40000/4922894\n", + "2019-01-31 00:15:47,687 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:47,951 : INFO : topic #23 (0.020): 0.109*\"audit\" + 0.056*\"best\" + 0.020*\"yawn\" + 0.020*\"noll\" + 0.018*\"jacksonvil\" + 0.017*\"japanes\" + 0.013*\"women\" + 0.011*\"prison\" + 0.011*\"harmsworth\" + 0.009*\"winner\"\n", + "2019-01-31 00:15:47,953 : INFO : topic #42 (0.020): 0.026*\"german\" + 0.014*\"germani\" + 0.009*\"vol\" + 0.009*\"der\" + 0.007*\"jewish\" + 0.007*\"berlin\" + 0.006*\"anglo\" + 0.006*\"jeremiah\" + 0.006*\"und\" + 0.006*\"israel\"\n", + "2019-01-31 00:15:47,954 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.024*\"will\" + 0.017*\"jame\" + 0.016*\"georg\" + 0.014*\"rival\" + 0.010*\"chandra\" + 0.010*\"thirtieth\" + 0.009*\"townhous\" + 0.009*\"henri\" + 0.008*\"slur\"\n", + "2019-01-31 00:15:47,956 : INFO : topic #38 (0.020): 0.015*\"king\" + 0.013*\"walter\" + 0.010*\"aza\" + 0.010*\"teufel\" + 0.008*\"french\" + 0.007*\"embassi\" + 0.007*\"till\" + 0.006*\"yawn\" + 0.006*\"franc\" + 0.005*\"deal\"\n", + "2019-01-31 00:15:47,957 : INFO : topic #48 (0.020): 0.067*\"octob\" + 0.062*\"januari\" + 0.062*\"march\" + 0.060*\"sens\" + 0.056*\"notion\" + 0.056*\"april\" + 0.054*\"judici\" + 0.054*\"august\" + 0.053*\"decatur\" + 0.052*\"juli\"\n", + "2019-01-31 00:15:47,963 : INFO : topic diff=0.280474, rho=0.223607\n", + "2019-01-31 00:15:48,119 : INFO : PROGRESS: pass 0, at document #42000/4922894\n", + "2019-01-31 00:15:49,658 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:49,921 : INFO : topic #3 (0.020): 0.028*\"present\" + 0.022*\"american\" + 0.016*\"minist\" + 0.016*\"start\" + 0.016*\"seri\" + 0.015*\"offic\" + 0.013*\"appeas\" + 
0.013*\"gov\" + 0.012*\"gener\" + 0.012*\"bone\"\n", + "2019-01-31 00:15:49,922 : INFO : topic #36 (0.020): 0.025*\"companhia\" + 0.009*\"serv\" + 0.009*\"busi\" + 0.009*\"develop\" + 0.008*\"market\" + 0.008*\"manag\" + 0.008*\"produc\" + 0.008*\"oper\" + 0.008*\"network\" + 0.007*\"bank\"\n", + "2019-01-31 00:15:49,923 : INFO : topic #16 (0.020): 0.018*\"rotterdam\" + 0.018*\"london\" + 0.016*\"quarterli\" + 0.015*\"priest\" + 0.015*\"margin\" + 0.013*\"duke\" + 0.012*\"sino\" + 0.011*\"daughter\" + 0.011*\"di\" + 0.009*\"snatch\"\n", + "2019-01-31 00:15:49,925 : INFO : topic #48 (0.020): 0.067*\"octob\" + 0.066*\"march\" + 0.062*\"januari\" + 0.061*\"notion\" + 0.061*\"sens\" + 0.057*\"april\" + 0.055*\"judici\" + 0.055*\"august\" + 0.054*\"decatur\" + 0.053*\"juli\"\n", + "2019-01-31 00:15:49,926 : INFO : topic #32 (0.020): 0.080*\"district\" + 0.060*\"vigour\" + 0.053*\"popolo\" + 0.034*\"multitud\" + 0.028*\"regim\" + 0.024*\"prosper\" + 0.022*\"cotton\" + 0.020*\"tortur\" + 0.018*\"cede\" + 0.018*\"ruptur\"\n", + "2019-01-31 00:15:49,932 : INFO : topic diff=0.275367, rho=0.218218\n", + "2019-01-31 00:15:50,087 : INFO : PROGRESS: pass 0, at document #44000/4922894\n", + "2019-01-31 00:15:51,609 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:51,873 : INFO : topic #22 (0.020): 0.025*\"spars\" + 0.023*\"factor\" + 0.018*\"adulthood\" + 0.014*\"popolo\" + 0.014*\"isl\" + 0.013*\"hostil\" + 0.013*\"feel\" + 0.011*\"male\" + 0.010*\"live\" + 0.010*\"western\"\n", + "2019-01-31 00:15:51,874 : INFO : topic #2 (0.020): 0.051*\"shield\" + 0.019*\"narrat\" + 0.017*\"isl\" + 0.015*\"class\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.012*\"scot\" + 0.011*\"nativist\" + 0.011*\"crew\" + 0.009*\"vernon\"\n", + "2019-01-31 00:15:51,875 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.019*\"band\" + 0.018*\"muscl\" + 0.015*\"simultan\" + 0.013*\"toyota\" + 
0.013*\"charcoal\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:15:51,877 : INFO : topic #41 (0.020): 0.037*\"citi\" + 0.029*\"new\" + 0.017*\"year\" + 0.014*\"strategist\" + 0.014*\"center\" + 0.013*\"festiv\" + 0.012*\"palmer\" + 0.009*\"hot\" + 0.008*\"museo\" + 0.008*\"open\"\n", + "2019-01-31 00:15:51,878 : INFO : topic #12 (0.020): 0.006*\"number\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"differ\" + 0.005*\"servitud\" + 0.005*\"frontal\" + 0.005*\"uruguayan\" + 0.005*\"method\" + 0.005*\"measur\"\n", + "2019-01-31 00:15:51,883 : INFO : topic diff=0.267459, rho=0.213201\n", + "2019-01-31 00:15:52,039 : INFO : PROGRESS: pass 0, at document #46000/4922894\n", + "2019-01-31 00:15:53,587 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:53,852 : INFO : topic #43 (0.020): 0.056*\"elect\" + 0.050*\"parti\" + 0.020*\"conserv\" + 0.019*\"democrat\" + 0.019*\"voluntari\" + 0.017*\"member\" + 0.014*\"labour\" + 0.014*\"polici\" + 0.012*\"liber\" + 0.012*\"bypass\"\n", + "2019-01-31 00:15:53,853 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.018*\"muscl\" + 0.015*\"simultan\" + 0.013*\"toyota\" + 0.013*\"charcoal\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:15:53,854 : INFO : topic #13 (0.020): 0.032*\"sourc\" + 0.021*\"north\" + 0.020*\"weekli\" + 0.019*\"earthworm\" + 0.016*\"england\" + 0.014*\"ireland\" + 0.013*\"ipa\" + 0.013*\"youth\" + 0.012*\"wale\" + 0.011*\"castl\"\n", + "2019-01-31 00:15:53,856 : INFO : topic #47 (0.020): 0.050*\"muscl\" + 0.024*\"perceptu\" + 0.019*\"compos\" + 0.019*\"orchestr\" + 0.018*\"physician\" + 0.015*\"place\" + 0.011*\"jack\" + 0.011*\"word\" + 0.009*\"strict\" + 0.009*\"insomnia\"\n", + "2019-01-31 00:15:53,857 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.017*\"candid\" + 0.013*\"pour\" + 0.012*\"mode\" + 0.012*\"depress\" + 0.011*\"veget\" + 0.010*\"elabor\" + 0.008*\"produc\" 
+ 0.008*\"spectacl\" + 0.008*\"fuel\"\n", + "2019-01-31 00:15:53,863 : INFO : topic diff=0.261450, rho=0.208514\n", + "2019-01-31 00:15:54,018 : INFO : PROGRESS: pass 0, at document #48000/4922894\n", + "2019-01-31 00:15:55,518 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:55,782 : INFO : topic #38 (0.020): 0.017*\"king\" + 0.014*\"walter\" + 0.008*\"aza\" + 0.007*\"teufel\" + 0.007*\"french\" + 0.006*\"yawn\" + 0.006*\"embassi\" + 0.006*\"battalion\" + 0.006*\"princess\" + 0.006*\"empath\"\n", + "2019-01-31 00:15:55,783 : INFO : topic #12 (0.020): 0.007*\"gener\" + 0.007*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.005*\"differ\" + 0.005*\"servitud\" + 0.005*\"uruguayan\" + 0.005*\"utopian\" + 0.005*\"group\"\n", + "2019-01-31 00:15:55,785 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.007*\"place\" + 0.006*\"théori\" + 0.005*\"night\" + 0.004*\"appear\" + 0.004*\"gestur\" + 0.004*\"jolli\" + 0.004*\"live\" + 0.003*\"introductori\" + 0.003*\"man\"\n", + "2019-01-31 00:15:55,786 : INFO : topic #46 (0.020): 0.024*\"warmth\" + 0.019*\"turkish\" + 0.017*\"norwegian\" + 0.014*\"norwai\" + 0.011*\"sweden\" + 0.009*\"cameron\" + 0.009*\"turkei\" + 0.008*\"swedish\" + 0.008*\"scot\" + 0.008*\"weevil\"\n", + "2019-01-31 00:15:55,788 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.021*\"will\" + 0.016*\"jame\" + 0.014*\"georg\" + 0.013*\"rival\" + 0.010*\"thirtieth\" + 0.010*\"henri\" + 0.009*\"rhyme\" + 0.009*\"chandra\" + 0.009*\"slur\"\n", + "2019-01-31 00:15:55,793 : INFO : topic diff=0.250452, rho=0.204124\n", + "2019-01-31 00:15:55,947 : INFO : PROGRESS: pass 0, at document #50000/4922894\n", + "2019-01-31 00:15:57,482 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:15:57,746 : INFO : topic #36 (0.020): 0.022*\"companhia\" + 0.010*\"network\" + 0.009*\"manag\" + 0.009*\"market\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.009*\"busi\" + 
0.009*\"oper\" + 0.008*\"produc\" + 0.007*\"base\"\n", + "2019-01-31 00:15:57,747 : INFO : topic #40 (0.020): 0.075*\"unit\" + 0.028*\"collector\" + 0.013*\"american\" + 0.013*\"start\" + 0.012*\"institut\" + 0.011*\"governor\" + 0.011*\"new\" + 0.011*\"professor\" + 0.010*\"scholar\" + 0.009*\"degre\"\n" + ] + }, { - "name": "stdout", + "name": "stderr", "output_type": "stream", "text": [ - "====================\n", - "nmf\n", - "====================\n", - "\n", - "Topic: 24\n", - "0.131*\"mount\" + 0.129*\"lemmon\" + 0.129*\"peak\" + 0.127*\"kitt\" + 0.127*\"spacewatch\" + 0.065*\"survei\" + 0.037*\"octob\" + 0.031*\"septemb\" + 0.023*\"css\" + 0.023*\"catalina\"\n", - "\n", - "Topic: 32\n", - "0.196*\"linear\" + 0.195*\"socorro\" + 0.045*\"septemb\" + 0.039*\"neat\" + 0.035*\"palomar\" + 0.032*\"octob\" + 0.024*\"kitt\" + 0.024*\"peak\" + 0.024*\"spacewatch\" + 0.023*\"anderson\"\n", - "\n", - "Topic: 8\n", - "0.331*\"align\" + 0.270*\"left\" + 0.071*\"right\" + 0.040*\"text\" + 0.035*\"style\" + 0.022*\"center\" + 0.013*\"bar\" + 0.009*\"till\" + 0.008*\"bgcolor\" + 0.008*\"color\"\n", - "\n", - "Topic: 27\n", - "0.186*\"district\" + 0.027*\"pennsylvania\" + 0.022*\"grade\" + 0.017*\"fund\" + 0.017*\"educ\" + 0.017*\"basic\" + 0.016*\"level\" + 0.014*\"oblast\" + 0.014*\"rural\" + 0.013*\"tax\"\n", - "\n", - "Topic: 48\n", - "0.103*\"art\" + 0.066*\"museum\" + 0.040*\"paint\" + 0.035*\"work\" + 0.026*\"artist\" + 0.024*\"galleri\" + 0.022*\"exhibit\" + 0.019*\"collect\" + 0.015*\"histori\" + 0.013*\"jpg\"\n", - "\n", - "Topic: 11\n", - "0.122*\"new\" + 0.043*\"york\" + 0.009*\"zealand\" + 0.007*\"jersei\" + 0.006*\"american\" + 0.006*\"time\" + 0.006*\"australia\" + 0.005*\"radio\" + 0.005*\"press\" + 0.005*\"washington\"\n", - "\n", - "Topic: 20\n", - "0.008*\"us\" + 0.006*\"gener\" + 0.006*\"model\" + 0.006*\"data\" + 0.006*\"design\" + 0.005*\"time\" + 0.005*\"function\" + 0.005*\"number\" + 0.005*\"process\" + 0.005*\"exampl\"\n", - "\n", - "Topic: 28\n", - 
"0.074*\"year\" + 0.022*\"dai\" + 0.012*\"time\" + 0.008*\"ag\" + 0.006*\"month\" + 0.006*\"includ\" + 0.006*\"follow\" + 0.005*\"later\" + 0.005*\"old\" + 0.005*\"student\"\n", - "\n", - "Topic: 38\n", - "0.033*\"royal\" + 0.025*\"john\" + 0.025*\"william\" + 0.016*\"lieuten\" + 0.013*\"georg\" + 0.012*\"offic\" + 0.012*\"jame\" + 0.011*\"sergeant\" + 0.011*\"major\" + 0.010*\"charl\"\n", - "\n", - "Topic: 19\n", - "0.012*\"area\" + 0.011*\"river\" + 0.010*\"water\" + 0.004*\"larg\" + 0.004*\"region\" + 0.004*\"lake\" + 0.004*\"power\" + 0.004*\"high\" + 0.004*\"bar\" + 0.004*\"form\"\n", - "\n", - "\n", - "====================\n", - "nmf_with_r\n", - "====================\n", - "\n", - "Topic: 49\n", - "0.112*\"peak\" + 0.111*\"kitt\" + 0.111*\"mount\" + 0.111*\"spacewatch\" + 0.109*\"lemmon\" + 0.055*\"survei\" + 0.044*\"octob\" + 0.041*\"septemb\" + 0.026*\"novemb\" + 0.021*\"march\"\n", - "\n", - "Topic: 32\n", - "0.194*\"linear\" + 0.193*\"socorro\" + 0.047*\"septemb\" + 0.038*\"neat\" + 0.034*\"palomar\" + 0.034*\"octob\" + 0.025*\"decemb\" + 0.024*\"august\" + 0.023*\"anderson\" + 0.023*\"mesa\"\n", - "\n", - "Topic: 48\n", - "0.112*\"art\" + 0.063*\"museum\" + 0.037*\"paint\" + 0.036*\"work\" + 0.028*\"artist\" + 0.026*\"galleri\" + 0.025*\"exhibit\" + 0.020*\"collect\" + 0.015*\"histori\" + 0.014*\"design\"\n", - "\n", - "Topic: 4\n", - "0.093*\"club\" + 0.049*\"cup\" + 0.033*\"footbal\" + 0.031*\"goal\" + 0.022*\"leagu\" + 0.022*\"unit\" + 0.022*\"plai\" + 0.022*\"match\" + 0.018*\"score\" + 0.015*\"player\"\n", - "\n", - "Topic: 27\n", - "0.159*\"district\" + 0.031*\"pennsylvania\" + 0.025*\"grade\" + 0.021*\"educ\" + 0.019*\"fund\" + 0.018*\"basic\" + 0.017*\"level\" + 0.015*\"student\" + 0.014*\"receiv\" + 0.014*\"tax\"\n", - "\n", - "Topic: 17\n", - "0.095*\"season\" + 0.014*\"plai\" + 0.010*\"coach\" + 0.009*\"final\" + 0.009*\"second\" + 0.008*\"win\" + 0.008*\"record\" + 0.008*\"career\" + 0.008*\"finish\" + 0.007*\"point\"\n", - "\n", - "Topic: 
40\n", - "0.009*\"time\" + 0.008*\"later\" + 0.007*\"kill\" + 0.006*\"appear\" + 0.005*\"man\" + 0.005*\"death\" + 0.005*\"father\" + 0.005*\"return\" + 0.005*\"son\" + 0.004*\"charact\"\n", - "\n", - "Topic: 20\n", - "0.008*\"us\" + 0.006*\"gener\" + 0.005*\"design\" + 0.005*\"model\" + 0.005*\"develop\" + 0.005*\"time\" + 0.004*\"data\" + 0.004*\"number\" + 0.004*\"function\" + 0.004*\"process\"\n", - "\n", - "Topic: 19\n", - "0.009*\"water\" + 0.008*\"area\" + 0.008*\"speci\" + 0.005*\"larg\" + 0.004*\"order\" + 0.004*\"region\" + 0.004*\"includ\" + 0.004*\"black\" + 0.004*\"famili\" + 0.004*\"popul\"\n", - "\n", - "Topic: 38\n", - "0.044*\"royal\" + 0.020*\"william\" + 0.019*\"john\" + 0.016*\"corp\" + 0.014*\"lieuten\" + 0.013*\"capt\" + 0.012*\"engin\" + 0.011*\"armi\" + 0.011*\"georg\" + 0.011*\"temp\"\n", - "\n", - "\n", - "====================\n", - "lda\n", - "====================\n", - "\n", - "Topic: 35\n", - "0.034*\"kong\" + 0.034*\"japanes\" + 0.033*\"hong\" + 0.023*\"lee\" + 0.021*\"singapor\" + 0.019*\"chines\" + 0.018*\"kim\" + 0.015*\"japan\" + 0.014*\"indonesia\" + 0.014*\"thailand\"\n", - "\n", - "Topic: 23\n", - "0.016*\"medic\" + 0.014*\"health\" + 0.014*\"hospit\" + 0.013*\"cell\" + 0.011*\"diseas\" + 0.010*\"patient\" + 0.009*\"ret\" + 0.009*\"caus\" + 0.008*\"human\" + 0.008*\"treatment\"\n", - "\n", - "Topic: 47\n", - "0.025*\"river\" + 0.024*\"station\" + 0.021*\"line\" + 0.020*\"road\" + 0.017*\"railwai\" + 0.015*\"rout\" + 0.013*\"lake\" + 0.012*\"park\" + 0.011*\"bridg\" + 0.011*\"area\"\n", - "\n", - "Topic: 14\n", - "0.027*\"univers\" + 0.015*\"research\" + 0.014*\"institut\" + 0.012*\"nation\" + 0.012*\"scienc\" + 0.012*\"work\" + 0.012*\"intern\" + 0.011*\"award\" + 0.011*\"develop\" + 0.010*\"organ\"\n", - "\n", - "Topic: 39\n", - "0.050*\"air\" + 0.026*\"aircraft\" + 0.026*\"oper\" + 0.025*\"airport\" + 0.017*\"forc\" + 0.017*\"flight\" + 0.015*\"squadron\" + 0.014*\"unit\" + 0.012*\"base\" + 0.011*\"wing\"\n", - "\n", - "Topic: 
17\n", - "0.060*\"race\" + 0.020*\"car\" + 0.017*\"team\" + 0.012*\"finish\" + 0.012*\"tour\" + 0.012*\"driver\" + 0.011*\"ford\" + 0.011*\"time\" + 0.011*\"championship\" + 0.011*\"year\"\n", - "\n", - "Topic: 4\n", - "0.137*\"school\" + 0.040*\"colleg\" + 0.039*\"student\" + 0.033*\"univers\" + 0.030*\"high\" + 0.028*\"educ\" + 0.016*\"year\" + 0.011*\"graduat\" + 0.010*\"state\" + 0.009*\"campu\"\n", - "\n", - "Topic: 8\n", - "0.048*\"india\" + 0.037*\"indian\" + 0.020*\"http\" + 0.016*\"www\" + 0.015*\"pakistan\" + 0.015*\"iran\" + 0.013*\"sri\" + 0.012*\"khan\" + 0.012*\"islam\" + 0.012*\"tamil\"\n", - "\n", - "Topic: 2\n", - "0.062*\"german\" + 0.039*\"germani\" + 0.025*\"van\" + 0.023*\"von\" + 0.020*\"der\" + 0.019*\"dutch\" + 0.019*\"berlin\" + 0.015*\"swedish\" + 0.014*\"netherland\" + 0.014*\"sweden\"\n", - "\n", - "Topic: 11\n", - "0.024*\"law\" + 0.021*\"court\" + 0.016*\"state\" + 0.016*\"act\" + 0.011*\"polic\" + 0.010*\"case\" + 0.009*\"offic\" + 0.009*\"report\" + 0.009*\"right\" + 0.007*\"legal\"\n", - "\n", - "\n" + "2019-01-31 00:15:57,749 : INFO : topic #48 (0.020): 0.065*\"octob\" + 0.063*\"notion\" + 0.063*\"januari\" + 0.063*\"sens\" + 0.060*\"judici\" + 0.060*\"march\" + 0.059*\"april\" + 0.059*\"august\" + 0.057*\"decatur\" + 0.056*\"juli\"\n", + "2019-01-31 00:15:57,751 : INFO : topic #21 (0.020): 0.025*\"samford\" + 0.021*\"spain\" + 0.019*\"mexico\" + 0.016*\"del\" + 0.012*\"juan\" + 0.012*\"soviet\" + 0.012*\"mexican\" + 0.011*\"plung\" + 0.010*\"santa\" + 0.010*\"josé\"\n", + "2019-01-31 00:15:57,752 : INFO : topic #49 (0.020): 0.028*\"india\" + 0.022*\"incumb\" + 0.007*\"singh\" + 0.006*\"peopl\" + 0.006*\"pakistan\" + 0.006*\"treeless\" + 0.006*\"alam\" + 0.006*\"pradesh\" + 0.006*\"area\" + 0.006*\"khalsa\"\n", + "2019-01-31 00:15:57,758 : INFO : topic diff=0.237375, rho=0.200000\n", + "2019-01-31 00:15:57,910 : INFO : PROGRESS: pass 0, at document #52000/4922894\n", + "2019-01-31 00:15:59,443 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 00:15:59,707 : INFO : topic #21 (0.020): 0.027*\"samford\" + 0.020*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.013*\"juan\" + 0.011*\"mexican\" + 0.011*\"soviet\" + 0.011*\"josé\" + 0.010*\"plung\" + 0.010*\"rico\"\n", + "2019-01-31 00:15:59,709 : INFO : topic #25 (0.020): 0.022*\"ring\" + 0.015*\"lagrang\" + 0.015*\"mount\" + 0.012*\"area\" + 0.011*\"palmer\" + 0.009*\"warmth\" + 0.008*\"robespierr\" + 0.007*\"natur\" + 0.007*\"mound\" + 0.006*\"foam\"\n", + "2019-01-31 00:15:59,710 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"armi\" + 0.018*\"walter\" + 0.018*\"aggress\" + 0.017*\"com\" + 0.014*\"unionist\" + 0.012*\"oper\" + 0.012*\"militari\" + 0.011*\"diversifi\" + 0.011*\"refut\"\n", + "2019-01-31 00:15:59,711 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.051*\"arsen\" + 0.029*\"line\" + 0.028*\"museo\" + 0.027*\"raid\" + 0.020*\"word\" + 0.020*\"pain\" + 0.017*\"traceabl\" + 0.016*\"artist\" + 0.013*\"gai\"\n", + "2019-01-31 00:15:59,712 : INFO : topic #8 (0.020): 0.032*\"start\" + 0.023*\"law\" + 0.018*\"cortic\" + 0.018*\"act\" + 0.016*\"unionist\" + 0.011*\"feder\" + 0.011*\"ricardo\" + 0.010*\"serv\" + 0.010*\"fengxiang\" + 0.009*\"case\"\n", + "2019-01-31 00:15:59,718 : INFO : topic diff=0.228056, rho=0.196116\n", + "2019-01-31 00:15:59,867 : INFO : PROGRESS: pass 0, at document #54000/4922894\n", + "2019-01-31 00:16:01,364 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:01,628 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"proper\" + 0.008*\"acid\" + 0.007*\"disco\" + 0.007*\"pathwai\" + 0.007*\"treat\" + 0.006*\"caus\" + 0.006*\"gastrointestin\" + 0.006*\"media\" + 0.006*\"effect\"\n", + "2019-01-31 00:16:01,630 : INFO : topic #2 (0.020): 0.046*\"shield\" + 0.025*\"isl\" + 0.018*\"narrat\" + 0.015*\"pope\" + 0.015*\"class\" + 0.013*\"blur\" + 0.011*\"scot\" + 0.011*\"crew\" + 0.010*\"vernon\" + 0.010*\"fleet\"\n", 
+ "2019-01-31 00:16:01,631 : INFO : topic #15 (0.020): 0.020*\"requir\" + 0.012*\"develop\" + 0.012*\"schuster\" + 0.012*\"small\" + 0.011*\"student\" + 0.009*\"word\" + 0.008*\"socialist\" + 0.008*\"human\" + 0.007*\"intern\" + 0.007*\"institut\"\n", + "2019-01-31 00:16:01,633 : INFO : topic #48 (0.020): 0.061*\"march\" + 0.061*\"octob\" + 0.060*\"april\" + 0.059*\"judici\" + 0.059*\"januari\" + 0.059*\"notion\" + 0.059*\"sens\" + 0.057*\"februari\" + 0.054*\"decatur\" + 0.053*\"juli\"\n", + "2019-01-31 00:16:01,635 : INFO : topic #43 (0.020): 0.060*\"elect\" + 0.047*\"parti\" + 0.020*\"voluntari\" + 0.019*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"conserv\" + 0.013*\"republ\" + 0.012*\"bypass\" + 0.012*\"liber\"\n", + "2019-01-31 00:16:01,640 : INFO : topic diff=0.220688, rho=0.192450\n", + "2019-01-31 00:16:01,795 : INFO : PROGRESS: pass 0, at document #56000/4922894\n", + "2019-01-31 00:16:03,341 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:03,606 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.014*\"candid\" + 0.013*\"pour\" + 0.012*\"depress\" + 0.012*\"mode\" + 0.010*\"veget\" + 0.009*\"elabor\" + 0.008*\"produc\" + 0.008*\"mandir\" + 0.007*\"spectacl\"\n", + "2019-01-31 00:16:03,607 : INFO : topic #33 (0.020): 0.043*\"french\" + 0.033*\"franc\" + 0.023*\"jean\" + 0.022*\"pari\" + 0.020*\"daphn\" + 0.020*\"sail\" + 0.019*\"wreath\" + 0.016*\"lazi\" + 0.011*\"piec\" + 0.009*\"convei\"\n", + "2019-01-31 00:16:03,608 : INFO : topic #30 (0.020): 0.032*\"cleveland\" + 0.028*\"leagu\" + 0.026*\"place\" + 0.024*\"taxpay\" + 0.024*\"crete\" + 0.022*\"scientist\" + 0.020*\"folei\" + 0.015*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:16:03,609 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.050*\"arsen\" + 0.034*\"line\" + 0.029*\"raid\" + 0.027*\"museo\" + 0.021*\"word\" + 0.020*\"pain\" + 0.019*\"traceabl\" + 0.016*\"artist\" + 0.014*\"exhaust\"\n", + 
"2019-01-31 00:16:03,610 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.019*\"north\" + 0.019*\"england\" + 0.017*\"ireland\" + 0.017*\"earthworm\" + 0.017*\"weekli\" + 0.013*\"australia\" + 0.013*\"wale\" + 0.013*\"london\" + 0.012*\"ipa\"\n", + "2019-01-31 00:16:03,616 : INFO : topic diff=0.216646, rho=0.188982\n", + "2019-01-31 00:16:03,772 : INFO : PROGRESS: pass 0, at document #58000/4922894\n", + "2019-01-31 00:16:05,313 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:05,579 : INFO : topic #17 (0.020): 0.047*\"church\" + 0.021*\"bishop\" + 0.019*\"centuri\" + 0.017*\"retroflex\" + 0.016*\"cathol\" + 0.014*\"fifteenth\" + 0.013*\"sail\" + 0.013*\"jpg\" + 0.011*\"italian\" + 0.010*\"christian\"\n", + "2019-01-31 00:16:05,580 : INFO : topic #32 (0.020): 0.082*\"district\" + 0.063*\"vigour\" + 0.044*\"popolo\" + 0.033*\"regim\" + 0.029*\"multitud\" + 0.028*\"tortur\" + 0.023*\"prosper\" + 0.023*\"cotton\" + 0.020*\"area\" + 0.018*\"cede\"\n", + "2019-01-31 00:16:05,581 : INFO : topic #23 (0.020): 0.120*\"audit\" + 0.059*\"best\" + 0.026*\"jacksonvil\" + 0.022*\"yawn\" + 0.022*\"noll\" + 0.020*\"japanes\" + 0.017*\"women\" + 0.012*\"prison\" + 0.010*\"festiv\" + 0.010*\"intern\"\n", + "2019-01-31 00:16:05,582 : INFO : topic #2 (0.020): 0.046*\"shield\" + 0.030*\"isl\" + 0.017*\"narrat\" + 0.015*\"pope\" + 0.015*\"class\" + 0.012*\"blur\" + 0.011*\"scot\" + 0.011*\"crew\" + 0.010*\"vernon\" + 0.010*\"coalit\"\n", + "2019-01-31 00:16:05,583 : INFO : topic #15 (0.020): 0.020*\"requir\" + 0.013*\"schuster\" + 0.013*\"develop\" + 0.011*\"small\" + 0.011*\"word\" + 0.010*\"student\" + 0.009*\"socialist\" + 0.008*\"human\" + 0.007*\"intern\" + 0.006*\"theoret\"\n", + "2019-01-31 00:16:05,589 : INFO : topic diff=0.207294, rho=0.185695\n", + "2019-01-31 00:16:08,366 : INFO : -11.864 per-word bound, 3727.7 perplexity estimate based on a held-out corpus of 2000 documents with 543136 words\n", + "2019-01-31 00:16:08,367 
: INFO : PROGRESS: pass 0, at document #60000/4922894\n", + "2019-01-31 00:16:09,880 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:10,144 : INFO : topic #13 (0.020): 0.031*\"sourc\" + 0.018*\"england\" + 0.018*\"ireland\" + 0.018*\"north\" + 0.017*\"weekli\" + 0.016*\"australia\" + 0.016*\"earthworm\" + 0.014*\"london\" + 0.012*\"ipa\" + 0.012*\"castl\"\n", + "2019-01-31 00:16:10,145 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.013*\"candid\" + 0.013*\"pour\" + 0.012*\"depress\" + 0.012*\"mode\" + 0.011*\"veget\" + 0.008*\"elabor\" + 0.008*\"produc\" + 0.007*\"mandir\" + 0.007*\"spectacl\"\n", + "2019-01-31 00:16:10,146 : INFO : topic #34 (0.020): 0.049*\"start\" + 0.045*\"cotton\" + 0.019*\"unionist\" + 0.017*\"terri\" + 0.016*\"california\" + 0.014*\"toni\" + 0.012*\"violent\" + 0.012*\"carefulli\" + 0.010*\"citi\" + 0.010*\"warrior\"\n", + "2019-01-31 00:16:10,148 : INFO : topic #29 (0.020): 0.015*\"govern\" + 0.013*\"replac\" + 0.007*\"start\" + 0.007*\"nation\" + 0.007*\"yawn\" + 0.007*\"organ\" + 0.006*\"unfortun\" + 0.006*\"placement\" + 0.006*\"countri\" + 0.005*\"million\"\n", + "2019-01-31 00:16:10,149 : INFO : topic #38 (0.020): 0.015*\"king\" + 0.015*\"walter\" + 0.010*\"aza\" + 0.009*\"teufel\" + 0.007*\"battalion\" + 0.007*\"till\" + 0.007*\"yawn\" + 0.006*\"french\" + 0.006*\"embassi\" + 0.006*\"princess\"\n", + "2019-01-31 00:16:10,155 : INFO : topic diff=0.195251, rho=0.182574\n", + "2019-01-31 00:16:10,363 : INFO : PROGRESS: pass 0, at document #62000/4922894\n", + "2019-01-31 00:16:11,872 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:12,137 : INFO : topic #2 (0.020): 0.041*\"shield\" + 0.038*\"isl\" + 0.021*\"pope\" + 0.017*\"narrat\" + 0.014*\"class\" + 0.014*\"blur\" + 0.011*\"crew\" + 0.011*\"scot\" + 0.011*\"coalit\" + 0.011*\"fleet\"\n", + "2019-01-31 00:16:12,139 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" 
+ 0.028*\"rel\" + 0.024*\"reconstruct\" + 0.020*\"band\" + 0.019*\"muscl\" + 0.017*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.011*\"myspac\"\n", + "2019-01-31 00:16:12,140 : INFO : topic #15 (0.020): 0.019*\"requir\" + 0.013*\"develop\" + 0.012*\"small\" + 0.012*\"schuster\" + 0.011*\"student\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.008*\"socialist\" + 0.008*\"human\" + 0.008*\"intern\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:16:12,142 : INFO : topic #30 (0.020): 0.033*\"cleveland\" + 0.029*\"leagu\" + 0.026*\"place\" + 0.024*\"taxpay\" + 0.022*\"scientist\" + 0.022*\"crete\" + 0.020*\"folei\" + 0.014*\"martin\" + 0.014*\"goal\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:16:12,143 : INFO : topic #49 (0.020): 0.032*\"india\" + 0.030*\"incumb\" + 0.010*\"singh\" + 0.009*\"alam\" + 0.008*\"televis\" + 0.007*\"sri\" + 0.006*\"pakistan\" + 0.006*\"tajikistan\" + 0.006*\"peopl\" + 0.006*\"muhammad\"\n", + "2019-01-31 00:16:12,149 : INFO : topic diff=0.184001, rho=0.179605\n", + "2019-01-31 00:16:12,306 : INFO : PROGRESS: pass 0, at document #64000/4922894\n", + "2019-01-31 00:16:13,850 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:14,115 : INFO : topic #15 (0.020): 0.019*\"requir\" + 0.013*\"develop\" + 0.012*\"schuster\" + 0.011*\"small\" + 0.010*\"word\" + 0.010*\"student\" + 0.008*\"cultur\" + 0.008*\"intern\" + 0.008*\"socialist\" + 0.008*\"human\"\n", + "2019-01-31 00:16:14,116 : INFO : topic #16 (0.020): 0.018*\"margin\" + 0.017*\"quarterli\" + 0.015*\"priest\" + 0.015*\"rotterdam\" + 0.014*\"london\" + 0.013*\"daughter\" + 0.011*\"duke\" + 0.011*\"marriag\" + 0.011*\"di\" + 0.010*\"sino\"\n", + "2019-01-31 00:16:14,117 : INFO : topic #34 (0.020): 0.053*\"start\" + 0.045*\"cotton\" + 0.020*\"unionist\" + 0.017*\"terri\" + 0.015*\"california\" + 0.012*\"toni\" + 0.012*\"violent\" + 0.012*\"warrior\" + 0.012*\"carefulli\" + 0.010*\"north\"\n", + 
"2019-01-31 00:16:14,119 : INFO : topic #29 (0.020): 0.015*\"govern\" + 0.012*\"replac\" + 0.007*\"yawn\" + 0.007*\"start\" + 0.007*\"nation\" + 0.006*\"unfortun\" + 0.006*\"organ\" + 0.006*\"placement\" + 0.005*\"countri\" + 0.005*\"new\"\n", + "2019-01-31 00:16:14,119 : INFO : topic #13 (0.020): 0.030*\"sourc\" + 0.018*\"ireland\" + 0.018*\"england\" + 0.017*\"north\" + 0.017*\"earthworm\" + 0.016*\"australia\" + 0.016*\"weekli\" + 0.014*\"london\" + 0.014*\"youth\" + 0.012*\"wale\"\n", + "2019-01-31 00:16:14,125 : INFO : topic diff=0.177516, rho=0.176777\n", + "2019-01-31 00:16:14,280 : INFO : PROGRESS: pass 0, at document #66000/4922894\n", + "2019-01-31 00:16:15,801 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:16,066 : INFO : topic #18 (0.020): 0.007*\"man\" + 0.007*\"théori\" + 0.007*\"kill\" + 0.006*\"later\" + 0.005*\"deal\" + 0.005*\"sack\" + 0.004*\"life\" + 0.004*\"charact\" + 0.004*\"teatro\" + 0.004*\"fraud\"\n", + "2019-01-31 00:16:16,067 : INFO : topic #27 (0.020): 0.048*\"questionnair\" + 0.015*\"dai\" + 0.015*\"taxpay\" + 0.015*\"rick\" + 0.015*\"tornado\" + 0.013*\"théori\" + 0.011*\"find\" + 0.011*\"horac\" + 0.011*\"squatter\" + 0.010*\"yawn\"\n", + "2019-01-31 00:16:16,068 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.048*\"arsen\" + 0.035*\"line\" + 0.031*\"raid\" + 0.026*\"museo\" + 0.022*\"traceabl\" + 0.022*\"word\" + 0.019*\"pain\" + 0.016*\"artist\" + 0.013*\"gai\"\n", + "2019-01-31 00:16:16,069 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.022*\"will\" + 0.016*\"jame\" + 0.013*\"georg\" + 0.012*\"rival\" + 0.010*\"rhyme\" + 0.009*\"david\" + 0.009*\"slur\" + 0.009*\"thirtieth\" + 0.007*\"edg\"\n", + "2019-01-31 00:16:16,070 : INFO : topic #3 (0.020): 0.028*\"present\" + 0.023*\"seri\" + 0.020*\"minist\" + 0.020*\"offic\" + 0.016*\"american\" + 0.016*\"gener\" + 0.016*\"appeas\" + 0.015*\"chickasaw\" + 0.014*\"start\" + 0.013*\"bone\"\n", + "2019-01-31 00:16:16,076 : INFO : 
topic diff=0.174786, rho=0.174078\n", + "2019-01-31 00:16:16,234 : INFO : PROGRESS: pass 0, at document #68000/4922894\n", + "2019-01-31 00:16:17,818 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:18,083 : INFO : topic #40 (0.020): 0.075*\"unit\" + 0.027*\"collector\" + 0.013*\"american\" + 0.012*\"governor\" + 0.012*\"professor\" + 0.011*\"institut\" + 0.011*\"new\" + 0.010*\"start\" + 0.010*\"schuster\" + 0.010*\"degre\"\n", + "2019-01-31 00:16:18,084 : INFO : topic #7 (0.020): 0.017*\"snatch\" + 0.015*\"church\" + 0.014*\"di\" + 0.013*\"locri\" + 0.012*\"factor\" + 0.011*\"john\" + 0.010*\"sir\" + 0.010*\"yawn\" + 0.009*\"margin\" + 0.008*\"life\"\n", + "2019-01-31 00:16:18,086 : INFO : topic #42 (0.020): 0.029*\"german\" + 0.017*\"germani\" + 0.011*\"vol\" + 0.011*\"der\" + 0.010*\"jewish\" + 0.010*\"greek\" + 0.009*\"berlin\" + 0.009*\"israel\" + 0.008*\"anglo\" + 0.007*\"austria\"\n", + "2019-01-31 00:16:18,087 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.018*\"lagrang\" + 0.014*\"mount\" + 0.013*\"area\" + 0.011*\"warmth\" + 0.010*\"palmer\" + 0.009*\"mound\" + 0.008*\"foam\" + 0.007*\"isl\" + 0.007*\"natur\"\n", + "2019-01-31 00:16:18,088 : INFO : topic #28 (0.020): 0.024*\"build\" + 0.019*\"hous\" + 0.017*\"rivièr\" + 0.015*\"buford\" + 0.010*\"histor\" + 0.009*\"lobe\" + 0.009*\"briarwood\" + 0.009*\"area\" + 0.009*\"constitut\" + 0.009*\"tortur\"\n", + "2019-01-31 00:16:18,094 : INFO : topic diff=0.168273, rho=0.171499\n", + "2019-01-31 00:16:18,247 : INFO : PROGRESS: pass 0, at document #70000/4922894\n", + "2019-01-31 00:16:19,759 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:20,024 : INFO : topic #22 (0.020): 0.028*\"spars\" + 0.026*\"factor\" + 0.021*\"adulthood\" + 0.015*\"hostil\" + 0.014*\"feel\" + 0.014*\"popolo\" + 0.012*\"male\" + 0.012*\"plaisir\" + 0.012*\"live\" + 0.010*\"yawn\"\n", + "2019-01-31 00:16:20,025 : INFO : topic #15 
(0.020): 0.019*\"requir\" + 0.013*\"develop\" + 0.012*\"small\" + 0.011*\"schuster\" + 0.011*\"word\" + 0.010*\"student\" + 0.009*\"human\" + 0.009*\"intern\" + 0.008*\"socialist\" + 0.008*\"cultur\"\n", + "2019-01-31 00:16:20,027 : INFO : topic #33 (0.020): 0.046*\"french\" + 0.036*\"franc\" + 0.024*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.018*\"daphn\" + 0.012*\"lazi\" + 0.012*\"convei\" + 0.012*\"piec\" + 0.011*\"focal\"\n", + "2019-01-31 00:16:20,028 : INFO : topic #20 (0.020): 0.103*\"scholar\" + 0.033*\"struggl\" + 0.029*\"educ\" + 0.022*\"high\" + 0.016*\"yawn\" + 0.013*\"prognosi\" + 0.012*\"collector\" + 0.010*\"commun\" + 0.008*\"class\" + 0.007*\"children\"\n", + "2019-01-31 00:16:20,029 : INFO : topic #46 (0.020): 0.028*\"warmth\" + 0.015*\"turkish\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.013*\"norwai\" + 0.013*\"sweden\" + 0.012*\"turkei\" + 0.012*\"swedish\" + 0.010*\"cameron\" + 0.009*\"wind\"\n", + "2019-01-31 00:16:20,036 : INFO : topic diff=0.152998, rho=0.169031\n", + "2019-01-31 00:16:20,192 : INFO : PROGRESS: pass 0, at document #72000/4922894\n", + "2019-01-31 00:16:21,747 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:22,012 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.021*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.010*\"juan\" + 0.010*\"carlo\" + 0.010*\"francisco\" + 0.009*\"mexican\"\n", + "2019-01-31 00:16:22,014 : INFO : topic #35 (0.020): 0.039*\"china\" + 0.034*\"russia\" + 0.032*\"sovereignti\" + 0.025*\"chilton\" + 0.024*\"rural\" + 0.017*\"reprint\" + 0.016*\"personifi\" + 0.015*\"poison\" + 0.012*\"moscow\" + 0.011*\"unfortun\"\n", + "2019-01-31 00:16:22,015 : INFO : topic #18 (0.020): 0.007*\"man\" + 0.007*\"théori\" + 0.007*\"kill\" + 0.006*\"later\" + 0.005*\"deal\" + 0.005*\"sack\" + 0.004*\"life\" + 0.004*\"charact\" + 0.004*\"help\" + 0.004*\"fraud\"\n", + "2019-01-31 00:16:22,017 : INFO : topic #27 (0.020): 
0.056*\"questionnair\" + 0.015*\"taxpay\" + 0.014*\"dai\" + 0.014*\"tornado\" + 0.013*\"théori\" + 0.012*\"rick\" + 0.012*\"candid\" + 0.011*\"find\" + 0.011*\"driver\" + 0.010*\"squatter\"\n", + "2019-01-31 00:16:22,018 : INFO : topic #20 (0.020): 0.103*\"scholar\" + 0.032*\"struggl\" + 0.028*\"educ\" + 0.022*\"high\" + 0.016*\"yawn\" + 0.013*\"prognosi\" + 0.012*\"collector\" + 0.010*\"commun\" + 0.008*\"class\" + 0.008*\"task\"\n", + "2019-01-31 00:16:22,024 : INFO : topic diff=0.152972, rho=0.166667\n", + "2019-01-31 00:16:22,179 : INFO : PROGRESS: pass 0, at document #74000/4922894\n", + "2019-01-31 00:16:23,699 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:23,963 : INFO : topic #46 (0.020): 0.023*\"warmth\" + 0.019*\"damag\" + 0.015*\"turkish\" + 0.014*\"cameron\" + 0.014*\"turkei\" + 0.013*\"sweden\" + 0.013*\"norwai\" + 0.013*\"norwegian\" + 0.011*\"ton\" + 0.011*\"swedish\"\n", + "2019-01-31 00:16:23,965 : INFO : topic #2 (0.020): 0.042*\"shield\" + 0.034*\"isl\" + 0.017*\"pope\" + 0.015*\"narrat\" + 0.015*\"class\" + 0.013*\"blur\" + 0.012*\"scot\" + 0.012*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\"\n", + "2019-01-31 00:16:23,966 : INFO : topic #17 (0.020): 0.044*\"church\" + 0.019*\"centuri\" + 0.017*\"bishop\" + 0.016*\"fifteenth\" + 0.016*\"retroflex\" + 0.016*\"cathol\" + 0.015*\"jpg\" + 0.013*\"italian\" + 0.013*\"sail\" + 0.010*\"christian\"\n", + "2019-01-31 00:16:23,968 : INFO : topic #42 (0.020): 0.030*\"german\" + 0.018*\"germani\" + 0.011*\"jewish\" + 0.011*\"der\" + 0.010*\"vol\" + 0.010*\"anglo\" + 0.009*\"berlin\" + 0.009*\"israel\" + 0.009*\"greek\" + 0.007*\"jeremiah\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:16:23,969 : INFO : topic #22 (0.020): 0.028*\"spars\" + 0.027*\"factor\" + 0.021*\"adulthood\" + 0.016*\"hostil\" + 0.015*\"feel\" + 0.014*\"popolo\" + 0.012*\"male\" + 0.012*\"live\" + 0.010*\"plaisir\" + 
0.010*\"yawn\"\n", + "2019-01-31 00:16:23,975 : INFO : topic diff=0.148557, rho=0.164399\n", + "2019-01-31 00:16:24,128 : INFO : PROGRESS: pass 0, at document #76000/4922894\n", + "2019-01-31 00:16:25,653 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:25,917 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.023*\"offic\" + 0.022*\"minist\" + 0.021*\"seri\" + 0.015*\"gener\" + 0.015*\"appeas\" + 0.014*\"chickasaw\" + 0.013*\"start\" + 0.012*\"member\" + 0.012*\"american\"\n", + "2019-01-31 00:16:25,918 : INFO : topic #14 (0.020): 0.021*\"walter\" + 0.021*\"forc\" + 0.019*\"armi\" + 0.019*\"aggress\" + 0.018*\"com\" + 0.014*\"militari\" + 0.013*\"unionist\" + 0.012*\"oper\" + 0.011*\"refut\" + 0.011*\"serv\"\n", + "2019-01-31 00:16:25,919 : INFO : topic #28 (0.020): 0.024*\"build\" + 0.019*\"hous\" + 0.018*\"rivièr\" + 0.014*\"buford\" + 0.010*\"histor\" + 0.010*\"rosenwald\" + 0.010*\"lobe\" + 0.009*\"area\" + 0.009*\"constitut\" + 0.009*\"briarwood\"\n", + "2019-01-31 00:16:25,920 : INFO : topic #44 (0.020): 0.027*\"rooftop\" + 0.025*\"wife\" + 0.025*\"final\" + 0.019*\"tourist\" + 0.016*\"champion\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.012*\"taxpay\" + 0.012*\"ret\"\n", + "2019-01-31 00:16:25,921 : INFO : topic #19 (0.020): 0.008*\"like\" + 0.008*\"form\" + 0.008*\"uruguayan\" + 0.007*\"origin\" + 0.007*\"woodcut\" + 0.007*\"mean\" + 0.007*\"charact\" + 0.007*\"differ\" + 0.006*\"pour\" + 0.006*\"anim\"\n", + "2019-01-31 00:16:25,927 : INFO : topic diff=0.135212, rho=0.162221\n", + "2019-01-31 00:16:26,085 : INFO : PROGRESS: pass 0, at document #78000/4922894\n", + "2019-01-31 00:16:27,656 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:27,921 : INFO : topic #17 (0.020): 0.043*\"church\" + 0.021*\"retroflex\" + 0.020*\"centuri\" + 0.018*\"bishop\" + 0.015*\"cathol\" + 0.015*\"fifteenth\" + 0.014*\"jpg\" + 0.013*\"sail\" + 
0.013*\"italian\" + 0.011*\"christian\"\n", + "2019-01-31 00:16:27,922 : INFO : topic #14 (0.020): 0.021*\"walter\" + 0.020*\"forc\" + 0.020*\"aggress\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"militari\" + 0.014*\"unionist\" + 0.011*\"oper\" + 0.010*\"serv\" + 0.010*\"airmen\"\n", + "2019-01-31 00:16:27,923 : INFO : topic #42 (0.020): 0.030*\"german\" + 0.018*\"germani\" + 0.012*\"vol\" + 0.011*\"jewish\" + 0.010*\"der\" + 0.010*\"anglo\" + 0.009*\"berlin\" + 0.009*\"israel\" + 0.008*\"greek\" + 0.006*\"und\"\n", + "2019-01-31 00:16:27,925 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.020*\"del\" + 0.019*\"spain\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.010*\"josé\" + 0.010*\"juan\" + 0.010*\"mexican\" + 0.010*\"carlo\"\n", + "2019-01-31 00:16:27,926 : INFO : topic #15 (0.020): 0.018*\"requir\" + 0.014*\"develop\" + 0.013*\"small\" + 0.011*\"schuster\" + 0.010*\"student\" + 0.010*\"word\" + 0.009*\"human\" + 0.008*\"commun\" + 0.008*\"intern\" + 0.008*\"socialist\"\n", + "2019-01-31 00:16:27,932 : INFO : topic diff=0.140688, rho=0.160128\n", + "2019-01-31 00:16:30,791 : INFO : -11.771 per-word bound, 3493.9 perplexity estimate based on a held-out corpus of 2000 documents with 590987 words\n", + "2019-01-31 00:16:30,792 : INFO : PROGRESS: pass 0, at document #80000/4922894\n", + "2019-01-31 00:16:32,340 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:32,604 : INFO : topic #34 (0.020): 0.061*\"start\" + 0.046*\"cotton\" + 0.023*\"toni\" + 0.023*\"unionist\" + 0.015*\"terri\" + 0.014*\"california\" + 0.012*\"violent\" + 0.011*\"carefulli\" + 0.011*\"north\" + 0.010*\"new\"\n", + "2019-01-31 00:16:32,605 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"gener\" + 0.007*\"frontal\" + 0.006*\"turn\" + 0.006*\"utopian\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"differ\"\n", + "2019-01-31 00:16:32,606 : INFO : topic #37 (0.020): 
0.008*\"love\" + 0.005*\"théori\" + 0.005*\"place\" + 0.005*\"gestur\" + 0.004*\"night\" + 0.004*\"bewild\" + 0.004*\"appear\" + 0.004*\"introductori\" + 0.004*\"dai\" + 0.004*\"litig\"\n", + "2019-01-31 00:16:32,608 : INFO : topic #24 (0.020): 0.035*\"book\" + 0.030*\"publicis\" + 0.018*\"word\" + 0.013*\"new\" + 0.012*\"storag\" + 0.012*\"edit\" + 0.011*\"presid\" + 0.011*\"magazin\" + 0.011*\"nicola\" + 0.010*\"worldwid\"\n", + "2019-01-31 00:16:32,609 : INFO : topic #42 (0.020): 0.029*\"german\" + 0.018*\"germani\" + 0.012*\"vol\" + 0.011*\"jewish\" + 0.009*\"anglo\" + 0.009*\"berlin\" + 0.009*\"israel\" + 0.009*\"der\" + 0.008*\"greek\" + 0.007*\"hungarian\"\n", + "2019-01-31 00:16:32,615 : INFO : topic diff=0.136293, rho=0.158114\n", + "2019-01-31 00:16:32,768 : INFO : PROGRESS: pass 0, at document #82000/4922894\n", + "2019-01-31 00:16:34,281 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:34,546 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.022*\"london\" + 0.021*\"australia\" + 0.020*\"ireland\" + 0.019*\"england\" + 0.017*\"north\" + 0.016*\"weekli\" + 0.014*\"wale\" + 0.014*\"earthworm\" + 0.013*\"castl\"\n", + "2019-01-31 00:16:34,547 : INFO : topic #28 (0.020): 0.024*\"build\" + 0.019*\"hous\" + 0.017*\"rivièr\" + 0.014*\"buford\" + 0.010*\"histor\" + 0.010*\"rosenwald\" + 0.009*\"lobe\" + 0.009*\"constitut\" + 0.009*\"briarwood\" + 0.009*\"area\"\n", + "2019-01-31 00:16:34,548 : INFO : topic #49 (0.020): 0.034*\"india\" + 0.023*\"incumb\" + 0.009*\"treeless\" + 0.009*\"pakistan\" + 0.009*\"tajikistan\" + 0.009*\"sri\" + 0.008*\"televis\" + 0.008*\"khalsa\" + 0.007*\"muskoge\" + 0.006*\"alam\"\n", + "2019-01-31 00:16:34,550 : INFO : topic #46 (0.020): 0.022*\"warmth\" + 0.020*\"stop\" + 0.017*\"damag\" + 0.016*\"wind\" + 0.012*\"norwai\" + 0.011*\"sweden\" + 0.011*\"cameron\" + 0.011*\"turkish\" + 0.011*\"norwegian\" + 0.009*\"turkei\"\n", + "2019-01-31 00:16:34,551 : INFO : topic #30 (0.020): 
0.035*\"cleveland\" + 0.031*\"leagu\" + 0.026*\"place\" + 0.024*\"taxpay\" + 0.024*\"crete\" + 0.022*\"scientist\" + 0.020*\"folei\" + 0.014*\"martin\" + 0.013*\"goal\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:16:34,557 : INFO : topic diff=0.124826, rho=0.156174\n", + "2019-01-31 00:16:34,714 : INFO : PROGRESS: pass 0, at document #84000/4922894\n", + "2019-01-31 00:16:36,235 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:36,500 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.032*\"leagu\" + 0.026*\"place\" + 0.024*\"crete\" + 0.024*\"taxpay\" + 0.022*\"scientist\" + 0.021*\"folei\" + 0.014*\"goal\" + 0.013*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:16:36,501 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.010*\"candid\" + 0.010*\"veget\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"produc\" + 0.008*\"turn\" + 0.008*\"fuel\"\n", + "2019-01-31 00:16:36,503 : INFO : topic #9 (0.020): 0.063*\"bone\" + 0.036*\"american\" + 0.016*\"valour\" + 0.013*\"smithsonian\" + 0.012*\"player\" + 0.012*\"dutch\" + 0.012*\"simpler\" + 0.012*\"folei\" + 0.011*\"english\" + 0.010*\"polit\"\n", + "2019-01-31 00:16:36,504 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.043*\"cotton\" + 0.023*\"unionist\" + 0.018*\"toni\" + 0.015*\"terri\" + 0.013*\"california\" + 0.013*\"violent\" + 0.012*\"north\" + 0.011*\"carefulli\" + 0.010*\"weekli\"\n", + "2019-01-31 00:16:36,505 : INFO : topic #25 (0.020): 0.026*\"ring\" + 0.016*\"lagrang\" + 0.014*\"mount\" + 0.014*\"area\" + 0.012*\"warmth\" + 0.009*\"palmer\" + 0.008*\"north\" + 0.007*\"mound\" + 0.007*\"foam\" + 0.007*\"lobe\"\n", + "2019-01-31 00:16:36,511 : INFO : topic diff=0.120656, rho=0.154303\n", + "2019-01-31 00:16:36,663 : INFO : PROGRESS: pass 0, at document #86000/4922894\n", + "2019-01-31 00:16:38,389 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:38,654 : INFO : 
topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"rel\" + 0.028*\"son\" + 0.027*\"reconstruct\" + 0.020*\"band\" + 0.019*\"muscl\" + 0.017*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 00:16:38,656 : INFO : topic #18 (0.020): 0.007*\"kill\" + 0.007*\"man\" + 0.006*\"théori\" + 0.006*\"later\" + 0.005*\"sack\" + 0.005*\"deal\" + 0.004*\"life\" + 0.004*\"charact\" + 0.004*\"fraud\" + 0.004*\"retrospect\"\n", + "2019-01-31 00:16:38,657 : INFO : topic #42 (0.020): 0.029*\"german\" + 0.018*\"germani\" + 0.012*\"vol\" + 0.011*\"jewish\" + 0.010*\"der\" + 0.010*\"berlin\" + 0.009*\"israel\" + 0.009*\"anglo\" + 0.008*\"austria\" + 0.008*\"egypt\"\n", + "2019-01-31 00:16:38,658 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.005*\"place\" + 0.005*\"gestur\" + 0.005*\"théori\" + 0.004*\"night\" + 0.004*\"litig\" + 0.004*\"bewild\" + 0.004*\"introductori\" + 0.004*\"appear\" + 0.003*\"dai\"\n", + "2019-01-31 00:16:38,659 : INFO : topic #33 (0.020): 0.050*\"french\" + 0.038*\"franc\" + 0.026*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.016*\"daphn\" + 0.015*\"wreath\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"quebec\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:16:38,665 : INFO : topic diff=0.113836, rho=0.152499\n", + "2019-01-31 00:16:38,821 : INFO : PROGRESS: pass 0, at document #88000/4922894\n", + "2019-01-31 00:16:40,395 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:40,660 : INFO : topic #22 (0.020): 0.031*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.018*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.014*\"popolo\" + 0.012*\"live\" + 0.010*\"plaisir\" + 0.010*\"avail\"\n", + "2019-01-31 00:16:40,661 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.040*\"cotton\" + 0.023*\"unionist\" + 0.015*\"toni\" + 0.015*\"california\" + 0.015*\"terri\" + 0.012*\"violent\" + 0.012*\"north\" + 0.010*\"carefulli\" + 
0.010*\"new\"\n", + "2019-01-31 00:16:40,662 : INFO : topic #11 (0.020): 0.030*\"john\" + 0.019*\"will\" + 0.016*\"jame\" + 0.012*\"georg\" + 0.012*\"rival\" + 0.010*\"david\" + 0.009*\"rhyme\" + 0.009*\"thirtieth\" + 0.009*\"slur\" + 0.007*\"chandra\"\n", + "2019-01-31 00:16:40,663 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"differ\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"cytokin\"\n", + "2019-01-31 00:16:40,664 : INFO : topic #40 (0.020): 0.082*\"unit\" + 0.033*\"collector\" + 0.015*\"institut\" + 0.013*\"american\" + 0.012*\"scholar\" + 0.012*\"schuster\" + 0.011*\"degre\" + 0.011*\"governor\" + 0.011*\"student\" + 0.011*\"professor\"\n", + "2019-01-31 00:16:40,670 : INFO : topic diff=0.112515, rho=0.150756\n", + "2019-01-31 00:16:40,827 : INFO : PROGRESS: pass 0, at document #90000/4922894\n", + "2019-01-31 00:16:42,365 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:42,630 : INFO : topic #40 (0.020): 0.082*\"unit\" + 0.032*\"collector\" + 0.015*\"institut\" + 0.013*\"american\" + 0.012*\"scholar\" + 0.012*\"schuster\" + 0.011*\"governor\" + 0.011*\"degre\" + 0.011*\"professor\" + 0.011*\"student\"\n", + "2019-01-31 00:16:42,632 : INFO : topic #42 (0.020): 0.031*\"german\" + 0.018*\"germani\" + 0.013*\"vol\" + 0.011*\"jewish\" + 0.011*\"berlin\" + 0.010*\"der\" + 0.009*\"israel\" + 0.008*\"anglo\" + 0.008*\"austria\" + 0.007*\"greek\"\n", + "2019-01-31 00:16:42,633 : INFO : topic #45 (0.020): 0.017*\"black\" + 0.016*\"record\" + 0.014*\"colder\" + 0.012*\"western\" + 0.011*\"blind\" + 0.010*\"light\" + 0.009*\"depress\" + 0.007*\"arm\" + 0.007*\"hand\" + 0.007*\"green\"\n", + "2019-01-31 00:16:42,634 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"differ\" + 0.006*\"southern\" + 0.006*\"turn\" + 
0.006*\"poet\" + 0.006*\"cytokin\"\n", + "2019-01-31 00:16:42,635 : INFO : topic #26 (0.020): 0.031*\"olymp\" + 0.031*\"workplac\" + 0.031*\"champion\" + 0.026*\"medal\" + 0.022*\"event\" + 0.022*\"woman\" + 0.019*\"gold\" + 0.019*\"rainfal\" + 0.018*\"men\" + 0.017*\"nation\"\n", + "2019-01-31 00:16:42,641 : INFO : topic diff=0.111307, rho=0.149071\n", + "2019-01-31 00:16:42,791 : INFO : PROGRESS: pass 0, at document #92000/4922894\n", + "2019-01-31 00:16:44,271 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:44,536 : INFO : topic #38 (0.020): 0.019*\"king\" + 0.014*\"walter\" + 0.013*\"aza\" + 0.013*\"teufel\" + 0.008*\"empath\" + 0.008*\"till\" + 0.008*\"embassi\" + 0.007*\"battalion\" + 0.007*\"armi\" + 0.006*\"forc\"\n", + "2019-01-31 00:16:44,538 : INFO : topic #36 (0.020): 0.026*\"companhia\" + 0.013*\"bank\" + 0.012*\"serv\" + 0.009*\"oper\" + 0.009*\"market\" + 0.009*\"develop\" + 0.008*\"busi\" + 0.008*\"manag\" + 0.008*\"produc\" + 0.008*\"includ\"\n", + "2019-01-31 00:16:44,539 : INFO : topic #18 (0.020): 0.007*\"man\" + 0.007*\"kill\" + 0.006*\"théori\" + 0.006*\"later\" + 0.005*\"deal\" + 0.005*\"sack\" + 0.004*\"life\" + 0.004*\"retrospect\" + 0.004*\"fraud\" + 0.004*\"help\"\n", + "2019-01-31 00:16:44,540 : INFO : topic #46 (0.020): 0.023*\"warmth\" + 0.021*\"wind\" + 0.020*\"stop\" + 0.017*\"damag\" + 0.012*\"norwai\" + 0.011*\"swedish\" + 0.011*\"cameron\" + 0.011*\"norwegian\" + 0.011*\"sweden\" + 0.009*\"turkish\"\n", + "2019-01-31 00:16:44,541 : INFO : topic #33 (0.020): 0.048*\"french\" + 0.039*\"franc\" + 0.024*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.013*\"piec\" + 0.012*\"loui\" + 0.012*\"wreath\"\n", + "2019-01-31 00:16:44,547 : INFO : topic diff=0.099452, rho=0.147442\n", + "2019-01-31 00:16:44,753 : INFO : PROGRESS: pass 0, at document #94000/4922894\n", + "2019-01-31 00:16:46,265 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:16:46,530 : INFO : topic #35 (0.020): 0.040*\"russia\" + 0.035*\"china\" + 0.024*\"rural\" + 0.021*\"sovereignti\" + 0.020*\"chilton\" + 0.018*\"reprint\" + 0.018*\"poison\" + 0.017*\"personifi\" + 0.014*\"unfortun\" + 0.013*\"shirin\"\n", + "2019-01-31 00:16:46,531 : INFO : topic #14 (0.020): 0.022*\"walter\" + 0.021*\"forc\" + 0.019*\"armi\" + 0.019*\"aggress\" + 0.017*\"com\" + 0.015*\"militari\" + 0.013*\"unionist\" + 0.012*\"oper\" + 0.011*\"refut\" + 0.011*\"airmen\"\n", + "2019-01-31 00:16:46,532 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.052*\"parti\" + 0.026*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"seaport\" + 0.013*\"republ\" + 0.013*\"bypass\" + 0.012*\"liber\"\n", + "2019-01-31 00:16:46,534 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.069*\"best\" + 0.031*\"yawn\" + 0.028*\"jacksonvil\" + 0.027*\"japanes\" + 0.023*\"noll\" + 0.017*\"women\" + 0.014*\"prison\" + 0.013*\"festiv\" + 0.010*\"intern\"\n", + "2019-01-31 00:16:46,535 : INFO : topic #47 (0.020): 0.073*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"compos\" + 0.016*\"physician\" + 0.015*\"damn\" + 0.014*\"place\" + 0.014*\"orchestr\" + 0.013*\"jack\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:16:46,541 : INFO : topic diff=0.100869, rho=0.145865\n", + "2019-01-31 00:16:46,699 : INFO : PROGRESS: pass 0, at document #96000/4922894\n", + "2019-01-31 00:16:48,255 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:48,520 : INFO : topic #45 (0.020): 0.019*\"record\" + 0.017*\"black\" + 0.016*\"western\" + 0.014*\"blind\" + 0.013*\"colder\" + 0.011*\"light\" + 0.008*\"depress\" + 0.008*\"wors\" + 0.007*\"bodi\" + 0.007*\"glass\"\n", + "2019-01-31 00:16:48,521 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.026*\"factor\" + 0.021*\"adulthood\" + 0.019*\"male\" + 0.017*\"feel\" + 0.016*\"hostil\" + 0.013*\"popolo\" + 0.012*\"live\" + 0.010*\"avail\" + 
0.010*\"genu\"\n", + "2019-01-31 00:16:48,522 : INFO : topic #0 (0.020): 0.059*\"statewid\" + 0.052*\"arsen\" + 0.041*\"line\" + 0.035*\"raid\" + 0.032*\"museo\" + 0.021*\"word\" + 0.021*\"pain\" + 0.018*\"traceabl\" + 0.018*\"artist\" + 0.016*\"exhaust\"\n", + "2019-01-31 00:16:48,524 : INFO : topic #9 (0.020): 0.079*\"bone\" + 0.051*\"american\" + 0.016*\"folei\" + 0.016*\"valour\" + 0.015*\"player\" + 0.013*\"polit\" + 0.013*\"simpler\" + 0.011*\"dutch\" + 0.011*\"english\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:16:48,525 : INFO : topic #6 (0.020): 0.065*\"fewer\" + 0.020*\"septemb\" + 0.017*\"epiru\" + 0.017*\"stake\" + 0.016*\"teacher\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"proclaim\" + 0.010*\"direct\" + 0.010*\"pop\"\n", + "2019-01-31 00:16:48,531 : INFO : topic diff=0.100107, rho=0.144338\n", + "2019-01-31 00:16:48,687 : INFO : PROGRESS: pass 0, at document #98000/4922894\n", + "2019-01-31 00:16:50,228 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:50,493 : INFO : topic #7 (0.020): 0.019*\"snatch\" + 0.017*\"di\" + 0.014*\"factor\" + 0.013*\"john\" + 0.012*\"locri\" + 0.011*\"yawn\" + 0.010*\"sir\" + 0.010*\"church\" + 0.009*\"faster\" + 0.009*\"margin\"\n", + "2019-01-31 00:16:50,495 : INFO : topic #48 (0.020): 0.075*\"march\" + 0.073*\"januari\" + 0.070*\"sens\" + 0.066*\"octob\" + 0.061*\"august\" + 0.060*\"juli\" + 0.059*\"april\" + 0.058*\"notion\" + 0.058*\"judici\" + 0.057*\"decatur\"\n", + "2019-01-31 00:16:50,496 : INFO : topic #27 (0.020): 0.058*\"questionnair\" + 0.017*\"taxpay\" + 0.015*\"dai\" + 0.014*\"tornado\" + 0.014*\"candid\" + 0.013*\"yawn\" + 0.011*\"théori\" + 0.011*\"find\" + 0.011*\"allud\" + 0.011*\"driver\"\n", + "2019-01-31 00:16:50,498 : INFO : topic #9 (0.020): 0.078*\"bone\" + 0.049*\"american\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"valour\" + 0.014*\"polit\" + 0.013*\"simpler\" + 0.012*\"dutch\" + 0.011*\"english\" + 0.011*\"acrimoni\"\n", + 
"2019-01-31 00:16:50,499 : INFO : topic #4 (0.020): 0.027*\"enfranchis\" + 0.018*\"candid\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"veget\" + 0.009*\"produc\" + 0.008*\"spectacl\" + 0.008*\"mode\" + 0.007*\"buford\"\n", + "2019-01-31 00:16:50,504 : INFO : topic diff=0.092596, rho=0.142857\n", + "2019-01-31 00:16:53,292 : INFO : -11.669 per-word bound, 3256.5 perplexity estimate based on a held-out corpus of 2000 documents with 568899 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:16:53,292 : INFO : PROGRESS: pass 0, at document #100000/4922894\n", + "2019-01-31 00:16:54,816 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:55,081 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.050*\"american\" + 0.018*\"valour\" + 0.017*\"folei\" + 0.016*\"player\" + 0.014*\"dutch\" + 0.014*\"polit\" + 0.013*\"simpler\" + 0.012*\"english\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:16:55,082 : INFO : topic #33 (0.020): 0.053*\"french\" + 0.039*\"franc\" + 0.024*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.015*\"daphn\" + 0.012*\"lazi\" + 0.012*\"piec\" + 0.011*\"loui\" + 0.009*\"focal\"\n", + "2019-01-31 00:16:55,083 : INFO : topic #6 (0.020): 0.064*\"fewer\" + 0.021*\"septemb\" + 0.017*\"stake\" + 0.017*\"epiru\" + 0.017*\"teacher\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.010*\"movi\" + 0.010*\"direct\" + 0.010*\"pop\"\n", + "2019-01-31 00:16:55,084 : INFO : topic #28 (0.020): 0.025*\"build\" + 0.024*\"hous\" + 0.019*\"rivièr\" + 0.016*\"buford\" + 0.012*\"histor\" + 0.010*\"rosenwald\" + 0.010*\"briarwood\" + 0.009*\"constitut\" + 0.009*\"lobe\" + 0.008*\"silicon\"\n", + "2019-01-31 00:16:55,085 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.047*\"arsen\" + 0.042*\"line\" + 0.034*\"raid\" + 0.029*\"museo\" + 0.021*\"traceabl\" + 0.020*\"word\" + 0.019*\"pain\" + 0.016*\"artist\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:16:55,091 : INFO : topic 
diff=0.098104, rho=0.141421\n", + "2019-01-31 00:16:55,250 : INFO : PROGRESS: pass 0, at document #102000/4922894\n", + "2019-01-31 00:16:56,793 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:57,058 : INFO : topic #44 (0.020): 0.027*\"rooftop\" + 0.025*\"final\" + 0.023*\"ret\" + 0.022*\"wife\" + 0.018*\"season\" + 0.017*\"tourist\" + 0.014*\"winner\" + 0.014*\"chamber\" + 0.013*\"champion\" + 0.013*\"tiepolo\"\n", + "2019-01-31 00:16:57,059 : INFO : topic #1 (0.020): 0.030*\"korean\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.025*\"korea\" + 0.025*\"chilton\" + 0.018*\"leah\" + 0.016*\"han\" + 0.015*\"kim\" + 0.015*\"china\" + 0.013*\"sourc\"\n", + "2019-01-31 00:16:57,060 : INFO : topic #32 (0.020): 0.076*\"district\" + 0.053*\"vigour\" + 0.045*\"popolo\" + 0.042*\"tortur\" + 0.032*\"regim\" + 0.028*\"multitud\" + 0.024*\"area\" + 0.023*\"cotton\" + 0.020*\"prosper\" + 0.020*\"commun\"\n", + "2019-01-31 00:16:57,061 : INFO : topic #16 (0.020): 0.022*\"priest\" + 0.017*\"quarterli\" + 0.016*\"rotterdam\" + 0.016*\"duke\" + 0.014*\"margin\" + 0.012*\"daughter\" + 0.010*\"maria\" + 0.010*\"snatch\" + 0.009*\"king\" + 0.009*\"sino\"\n", + "2019-01-31 00:16:57,063 : INFO : topic #46 (0.020): 0.021*\"warmth\" + 0.016*\"damag\" + 0.015*\"wind\" + 0.015*\"stop\" + 0.014*\"sk\" + 0.014*\"norwai\" + 0.012*\"norwegian\" + 0.012*\"sweden\" + 0.012*\"farid\" + 0.011*\"swedish\"\n", + "2019-01-31 00:16:57,069 : INFO : topic diff=0.087283, rho=0.140028\n", + "2019-01-31 00:16:57,220 : INFO : PROGRESS: pass 0, at document #104000/4922894\n", + "2019-01-31 00:16:58,708 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:16:58,973 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.028*\"incumb\" + 0.013*\"televis\" + 0.011*\"tajikistan\" + 0.010*\"pakistan\" + 0.009*\"sri\" + 0.008*\"muskoge\" + 0.008*\"singh\" + 0.008*\"khalsa\" + 0.007*\"islam\"\n", + "2019-01-31 00:16:58,975 : INFO : 
topic #38 (0.020): 0.019*\"king\" + 0.015*\"walter\" + 0.013*\"aza\" + 0.011*\"teufel\" + 0.009*\"till\" + 0.008*\"empath\" + 0.007*\"embassi\" + 0.007*\"battalion\" + 0.007*\"armi\" + 0.007*\"forc\"\n", + "2019-01-31 00:16:58,976 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 0.007*\"number\" + 0.007*\"exampl\" + 0.006*\"mode\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"differ\" + 0.006*\"servitud\" + 0.006*\"théori\"\n", + "2019-01-31 00:16:58,977 : INFO : topic #4 (0.020): 0.026*\"жизнь\" + 0.022*\"enfranchis\" + 0.019*\"automat\" + 0.017*\"mode\" + 0.015*\"candid\" + 0.014*\"depress\" + 0.012*\"pour\" + 0.011*\"pioneer\" + 0.011*\"season\" + 0.009*\"veget\"\n", + "2019-01-31 00:16:58,978 : INFO : topic #43 (0.020): 0.061*\"parti\" + 0.060*\"elect\" + 0.024*\"democrat\" + 0.024*\"voluntari\" + 0.021*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.013*\"bypass\" + 0.013*\"tendenc\"\n", + "2019-01-31 00:16:58,984 : INFO : topic diff=0.087083, rho=0.138675\n", + "2019-01-31 00:16:59,140 : INFO : PROGRESS: pass 0, at document #106000/4922894\n", + "2019-01-31 00:17:00,672 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:00,936 : INFO : topic #34 (0.020): 0.063*\"start\" + 0.036*\"cotton\" + 0.024*\"unionist\" + 0.016*\"california\" + 0.014*\"toni\" + 0.013*\"north\" + 0.013*\"terri\" + 0.013*\"carefulli\" + 0.013*\"violent\" + 0.012*\"american\"\n", + "2019-01-31 00:17:00,938 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"acid\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"includ\"\n", + "2019-01-31 00:17:00,939 : INFO : topic #17 (0.020): 0.049*\"church\" + 0.020*\"retroflex\" + 0.019*\"centuri\" + 0.018*\"jpg\" + 0.018*\"fifteenth\" + 0.018*\"cathol\" + 0.016*\"bishop\" + 0.013*\"italian\" + 0.013*\"christian\" + 0.012*\"sail\"\n", + "2019-01-31 00:17:00,940 : INFO 
: topic #22 (0.020): 0.031*\"spars\" + 0.030*\"factor\" + 0.028*\"genu\" + 0.021*\"adulthood\" + 0.016*\"hostil\" + 0.016*\"male\" + 0.016*\"feel\" + 0.013*\"popolo\" + 0.011*\"live\" + 0.010*\"plaisir\"\n", + "2019-01-31 00:17:00,942 : INFO : topic #6 (0.020): 0.062*\"fewer\" + 0.021*\"septemb\" + 0.018*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"acrimoni\" + 0.010*\"movi\" + 0.010*\"director\"\n", + "2019-01-31 00:17:00,947 : INFO : topic diff=0.089772, rho=0.137361\n", + "2019-01-31 00:17:01,102 : INFO : PROGRESS: pass 0, at document #108000/4922894\n", + "2019-01-31 00:17:02,637 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:02,901 : INFO : topic #28 (0.020): 0.025*\"build\" + 0.024*\"hous\" + 0.019*\"rivièr\" + 0.015*\"buford\" + 0.011*\"histor\" + 0.010*\"rosenwald\" + 0.010*\"constitut\" + 0.009*\"lobe\" + 0.009*\"briarwood\" + 0.008*\"silicon\"\n", + "2019-01-31 00:17:02,903 : INFO : topic #38 (0.020): 0.017*\"king\" + 0.017*\"walter\" + 0.012*\"aza\" + 0.011*\"teufel\" + 0.009*\"empath\" + 0.008*\"battalion\" + 0.008*\"till\" + 0.007*\"embassi\" + 0.007*\"armi\" + 0.007*\"forc\"\n", + "2019-01-31 00:17:02,904 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.027*\"cortic\" + 0.023*\"act\" + 0.022*\"start\" + 0.015*\"case\" + 0.010*\"ricardo\" + 0.009*\"legal\" + 0.009*\"unionist\" + 0.009*\"polaris\" + 0.008*\"feder\"\n", + "2019-01-31 00:17:02,905 : INFO : topic #35 (0.020): 0.042*\"russia\" + 0.034*\"china\" + 0.028*\"sovereignti\" + 0.027*\"reprint\" + 0.025*\"rural\" + 0.018*\"poison\" + 0.016*\"personifi\" + 0.016*\"unfortun\" + 0.015*\"chilton\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:17:02,906 : INFO : topic #14 (0.020): 0.026*\"forc\" + 0.024*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.016*\"com\" + 0.015*\"militari\" + 0.014*\"unionist\" + 0.012*\"rifl\" + 0.011*\"oper\" + 0.011*\"airbu\"\n", + "2019-01-31 00:17:02,912 : INFO : 
topic diff=0.081186, rho=0.136083\n", + "2019-01-31 00:17:03,072 : INFO : PROGRESS: pass 0, at document #110000/4922894\n", + "2019-01-31 00:17:04,635 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:04,901 : INFO : topic #38 (0.020): 0.017*\"walter\" + 0.017*\"king\" + 0.011*\"teufel\" + 0.011*\"aza\" + 0.008*\"empath\" + 0.008*\"battalion\" + 0.008*\"till\" + 0.007*\"embassi\" + 0.007*\"armi\" + 0.007*\"forc\"\n", + "2019-01-31 00:17:04,903 : INFO : topic #26 (0.020): 0.035*\"workplac\" + 0.033*\"champion\" + 0.027*\"olymp\" + 0.027*\"woman\" + 0.024*\"medal\" + 0.022*\"event\" + 0.021*\"men\" + 0.019*\"nation\" + 0.019*\"gold\" + 0.018*\"atheist\"\n", + "2019-01-31 00:17:04,904 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.015*\"com\" + 0.015*\"militari\" + 0.014*\"unionist\" + 0.014*\"refut\" + 0.011*\"rifl\" + 0.011*\"oper\"\n", + "2019-01-31 00:17:04,905 : INFO : topic #20 (0.020): 0.120*\"scholar\" + 0.031*\"struggl\" + 0.029*\"educ\" + 0.028*\"high\" + 0.016*\"yawn\" + 0.015*\"collector\" + 0.012*\"prognosi\" + 0.010*\"commun\" + 0.008*\"children\" + 0.008*\"class\"\n", + "2019-01-31 00:17:04,906 : INFO : topic #28 (0.020): 0.025*\"build\" + 0.023*\"hous\" + 0.020*\"rivièr\" + 0.015*\"buford\" + 0.011*\"histor\" + 0.010*\"rosenwald\" + 0.010*\"constitut\" + 0.009*\"lobe\" + 0.009*\"briarwood\" + 0.008*\"silicon\"\n", + "2019-01-31 00:17:04,911 : INFO : topic diff=0.083256, rho=0.134840\n", + "2019-01-31 00:17:05,066 : INFO : PROGRESS: pass 0, at document #112000/4922894\n", + "2019-01-31 00:17:06,597 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:17:06,862 : INFO : topic #19 (0.020): 0.008*\"like\" + 0.008*\"form\" + 0.008*\"woodcut\" + 0.008*\"origin\" + 0.008*\"uruguayan\" + 0.007*\"mean\" + 0.007*\"god\" + 0.007*\"charact\" 
+ 0.006*\"differ\" + 0.006*\"pour\"\n", + "2019-01-31 00:17:06,863 : INFO : topic #32 (0.020): 0.069*\"district\" + 0.052*\"vigour\" + 0.044*\"popolo\" + 0.041*\"tortur\" + 0.035*\"area\" + 0.030*\"regim\" + 0.028*\"multitud\" + 0.022*\"cotton\" + 0.022*\"station\" + 0.020*\"prosper\"\n", + "2019-01-31 00:17:06,864 : INFO : topic #49 (0.020): 0.039*\"india\" + 0.029*\"incumb\" + 0.013*\"tajikistan\" + 0.012*\"sri\" + 0.012*\"televis\" + 0.010*\"pakistan\" + 0.009*\"khalsa\" + 0.008*\"singh\" + 0.008*\"start\" + 0.008*\"lanka\"\n", + "2019-01-31 00:17:06,865 : INFO : topic #29 (0.020): 0.013*\"govern\" + 0.009*\"start\" + 0.009*\"replac\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"nation\" + 0.006*\"million\" + 0.006*\"new\" + 0.006*\"summerhil\" + 0.005*\"théori\"\n", + "2019-01-31 00:17:06,866 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.051*\"arsen\" + 0.040*\"line\" + 0.037*\"raid\" + 0.028*\"museo\" + 0.021*\"word\" + 0.020*\"traceabl\" + 0.020*\"pain\" + 0.019*\"artist\" + 0.017*\"serv\"\n", + "2019-01-31 00:17:06,872 : INFO : topic diff=0.072134, rho=0.133631\n", + "2019-01-31 00:17:07,028 : INFO : PROGRESS: pass 0, at document #114000/4922894\n", + "2019-01-31 00:17:08,568 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:08,833 : INFO : topic #38 (0.020): 0.019*\"king\" + 0.018*\"walter\" + 0.011*\"teufel\" + 0.010*\"aza\" + 0.008*\"battalion\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"embassi\" + 0.006*\"kingdom\"\n", + "2019-01-31 00:17:08,834 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.032*\"champion\" + 0.031*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.023*\"event\" + 0.022*\"medal\" + 0.018*\"atheist\" + 0.018*\"nation\" + 0.018*\"gold\"\n", + "2019-01-31 00:17:08,835 : INFO : topic #28 (0.020): 0.024*\"build\" + 0.024*\"hous\" + 0.023*\"rivièr\" + 0.016*\"buford\" + 0.011*\"histor\" + 0.010*\"constitut\" + 0.009*\"rosenwald\" + 0.009*\"lobe\" + 
0.009*\"briarwood\" + 0.008*\"silicon\"\n", + "2019-01-31 00:17:08,836 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.028*\"factor\" + 0.021*\"adulthood\" + 0.021*\"genu\" + 0.016*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.012*\"popolo\" + 0.012*\"live\" + 0.012*\"plaisir\"\n", + "2019-01-31 00:17:08,837 : INFO : topic #13 (0.020): 0.025*\"australia\" + 0.023*\"ireland\" + 0.023*\"sourc\" + 0.022*\"london\" + 0.021*\"australian\" + 0.020*\"england\" + 0.015*\"youth\" + 0.014*\"scotland\" + 0.014*\"weekli\" + 0.014*\"wale\"\n", + "2019-01-31 00:17:08,844 : INFO : topic diff=0.074001, rho=0.132453\n", + "2019-01-31 00:17:09,004 : INFO : PROGRESS: pass 0, at document #116000/4922894\n", + "2019-01-31 00:17:10,572 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:10,836 : INFO : topic #17 (0.020): 0.049*\"church\" + 0.019*\"bishop\" + 0.018*\"centuri\" + 0.018*\"jpg\" + 0.017*\"retroflex\" + 0.017*\"fifteenth\" + 0.017*\"cathol\" + 0.014*\"italian\" + 0.014*\"sail\" + 0.013*\"christian\"\n", + "2019-01-31 00:17:10,838 : INFO : topic #38 (0.020): 0.019*\"king\" + 0.017*\"walter\" + 0.010*\"teufel\" + 0.010*\"aza\" + 0.008*\"battalion\" + 0.008*\"empath\" + 0.008*\"armi\" + 0.007*\"till\" + 0.007*\"embassi\" + 0.007*\"forc\"\n", + "2019-01-31 00:17:10,839 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"disco\" + 0.008*\"acid\" + 0.007*\"media\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"disintegr\" + 0.006*\"activ\"\n", + "2019-01-31 00:17:10,840 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.020*\"adulthood\" + 0.019*\"genu\" + 0.016*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.012*\"popolo\" + 0.012*\"live\" + 0.011*\"plaisir\"\n", + "2019-01-31 00:17:10,841 : INFO : topic #26 (0.020): 0.033*\"woman\" + 0.032*\"workplac\" + 0.031*\"champion\" + 0.026*\"olymp\" + 0.025*\"men\" + 0.024*\"event\" + 0.022*\"medal\" + 0.019*\"atheist\" + 
0.018*\"rainfal\" + 0.018*\"nation\"\n", + "2019-01-31 00:17:10,847 : INFO : topic diff=0.073465, rho=0.131306\n", + "2019-01-31 00:17:11,002 : INFO : PROGRESS: pass 0, at document #118000/4922894\n", + "2019-01-31 00:17:12,524 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:12,789 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.019*\"will\" + 0.015*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"rhyme\" + 0.008*\"slur\" + 0.008*\"thirtieth\" + 0.007*\"chandra\"\n", + "2019-01-31 00:17:12,790 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.032*\"leagu\" + 0.027*\"place\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.024*\"taxpay\" + 0.021*\"folei\" + 0.017*\"martin\" + 0.017*\"goal\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:17:12,791 : INFO : topic #37 (0.020): 0.007*\"love\" + 0.005*\"gestur\" + 0.005*\"théori\" + 0.004*\"place\" + 0.004*\"night\" + 0.004*\"litig\" + 0.004*\"man\" + 0.004*\"blue\" + 0.003*\"introductori\" + 0.003*\"appear\"\n", + "2019-01-31 00:17:12,792 : INFO : topic #39 (0.020): 0.041*\"scientist\" + 0.035*\"taxpay\" + 0.024*\"clot\" + 0.024*\"canada\" + 0.019*\"canadian\" + 0.014*\"hoar\" + 0.013*\"basketbal\" + 0.013*\"confer\" + 0.010*\"toronto\" + 0.010*\"place\"\n", + "2019-01-31 00:17:12,794 : INFO : topic #49 (0.020): 0.037*\"india\" + 0.028*\"incumb\" + 0.014*\"tajikistan\" + 0.014*\"televis\" + 0.012*\"sri\" + 0.010*\"pakistan\" + 0.009*\"singh\" + 0.008*\"khalsa\" + 0.008*\"islam\" + 0.008*\"start\"\n", + "2019-01-31 00:17:12,800 : INFO : topic diff=0.069374, rho=0.130189\n", + "2019-01-31 00:17:15,656 : INFO : -11.572 per-word bound, 3045.6 perplexity estimate based on a held-out corpus of 2000 documents with 561550 words\n", + "2019-01-31 00:17:15,657 : INFO : PROGRESS: pass 0, at document #120000/4922894\n", + "2019-01-31 00:17:17,200 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:17,466 : INFO : 
topic #45 (0.020): 0.019*\"black\" + 0.018*\"record\" + 0.016*\"western\" + 0.016*\"colder\" + 0.016*\"blind\" + 0.011*\"light\" + 0.008*\"depress\" + 0.008*\"green\" + 0.006*\"illicit\" + 0.006*\"arm\"\n", + "2019-01-31 00:17:17,467 : INFO : topic #33 (0.020): 0.053*\"french\" + 0.048*\"franc\" + 0.026*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.012*\"lazi\" + 0.011*\"loui\" + 0.011*\"dish\" + 0.011*\"piec\"\n", + "2019-01-31 00:17:17,468 : INFO : topic #15 (0.020): 0.016*\"requir\" + 0.015*\"develop\" + 0.013*\"small\" + 0.011*\"word\" + 0.010*\"student\" + 0.008*\"socialist\" + 0.008*\"human\" + 0.008*\"cultur\" + 0.008*\"organ\" + 0.008*\"intern\"\n", + "2019-01-31 00:17:17,470 : INFO : topic #27 (0.020): 0.064*\"questionnair\" + 0.018*\"tornado\" + 0.018*\"taxpay\" + 0.012*\"candid\" + 0.012*\"driver\" + 0.012*\"dai\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.011*\"théori\" + 0.011*\"yawn\"\n", + "2019-01-31 00:17:17,471 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.024*\"final\" + 0.020*\"wife\" + 0.019*\"tourist\" + 0.018*\"ret\" + 0.013*\"winner\" + 0.013*\"chamber\" + 0.012*\"taxpay\" + 0.012*\"champion\" + 0.012*\"tiepolo\"\n", + "2019-01-31 00:17:17,477 : INFO : topic diff=0.065374, rho=0.129099\n", + "2019-01-31 00:17:17,631 : INFO : PROGRESS: pass 0, at document #122000/4922894\n", + "2019-01-31 00:17:19,141 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:19,406 : INFO : topic #29 (0.020): 0.013*\"govern\" + 0.009*\"replac\" + 0.009*\"start\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"summerhil\" + 0.006*\"new\" + 0.005*\"théori\"\n", + "2019-01-31 00:17:19,407 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.029*\"rel\" + 0.028*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:17:19,408 : INFO : topic #25 
(0.020): 0.027*\"ring\" + 0.015*\"lagrang\" + 0.014*\"area\" + 0.014*\"warmth\" + 0.014*\"mount\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"palmer\" + 0.007*\"robespierr\"\n", + "2019-01-31 00:17:19,410 : INFO : topic #20 (0.020): 0.122*\"scholar\" + 0.033*\"struggl\" + 0.028*\"educ\" + 0.027*\"high\" + 0.016*\"yawn\" + 0.014*\"collector\" + 0.012*\"prognosi\" + 0.010*\"commun\" + 0.010*\"children\" + 0.008*\"second\"\n", + "2019-01-31 00:17:19,411 : INFO : topic #17 (0.020): 0.054*\"church\" + 0.018*\"centuri\" + 0.018*\"bishop\" + 0.017*\"cathol\" + 0.016*\"jpg\" + 0.016*\"retroflex\" + 0.016*\"fifteenth\" + 0.014*\"italian\" + 0.014*\"christian\" + 0.014*\"sail\"\n", + "2019-01-31 00:17:19,417 : INFO : topic diff=0.066877, rho=0.128037\n", + "2019-01-31 00:17:19,570 : INFO : PROGRESS: pass 0, at document #124000/4922894\n", + "2019-01-31 00:17:21,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:17:21,352 : INFO : topic #41 (0.020): 0.047*\"citi\" + 0.038*\"new\" + 0.023*\"year\" + 0.022*\"palmer\" + 0.021*\"center\" + 0.019*\"strategist\" + 0.010*\"open\" + 0.009*\"hot\" + 0.009*\"includ\" + 0.008*\"lobe\"\n", + "2019-01-31 00:17:21,353 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.023*\"london\" + 0.023*\"england\" + 0.023*\"sourc\" + 0.022*\"ireland\" + 0.021*\"australian\" + 0.014*\"wale\" + 0.014*\"youth\" + 0.014*\"north\" + 0.014*\"new\"\n", + "2019-01-31 00:17:21,355 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.017*\"record\" + 0.015*\"colder\" + 0.015*\"western\" + 0.015*\"blind\" + 0.011*\"light\" + 0.008*\"green\" + 0.007*\"depress\" + 0.006*\"illicit\" + 0.006*\"wors\"\n", + "2019-01-31 00:17:21,355 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.030*\"collector\" + 0.015*\"institut\" + 0.013*\"student\" + 0.012*\"american\" + 0.012*\"professor\" + 0.012*\"schuster\" + 0.012*\"governor\" + 
0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:17:21,357 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.028*\"incumb\" + 0.012*\"televis\" + 0.012*\"sri\" + 0.012*\"tajikistan\" + 0.010*\"pakistan\" + 0.009*\"singh\" + 0.008*\"start\" + 0.008*\"khalsa\" + 0.008*\"islam\"\n", + "2019-01-31 00:17:21,363 : INFO : topic diff=0.067341, rho=0.127000\n", + "2019-01-31 00:17:21,519 : INFO : PROGRESS: pass 0, at document #126000/4922894\n", + "2019-01-31 00:17:23,043 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:23,308 : INFO : topic #32 (0.020): 0.066*\"district\" + 0.050*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.035*\"area\" + 0.030*\"regim\" + 0.027*\"multitud\" + 0.024*\"cotton\" + 0.019*\"prosper\" + 0.018*\"citi\"\n", + "2019-01-31 00:17:23,309 : INFO : topic #28 (0.020): 0.025*\"build\" + 0.023*\"hous\" + 0.021*\"rivièr\" + 0.016*\"buford\" + 0.012*\"histor\" + 0.010*\"constitut\" + 0.010*\"briarwood\" + 0.010*\"lobe\" + 0.009*\"rosenwald\" + 0.009*\"silicon\"\n", + "2019-01-31 00:17:23,310 : INFO : topic #15 (0.020): 0.016*\"requir\" + 0.014*\"develop\" + 0.013*\"small\" + 0.011*\"word\" + 0.010*\"student\" + 0.009*\"socialist\" + 0.009*\"cultur\" + 0.008*\"organ\" + 0.008*\"human\" + 0.008*\"commun\"\n", + "2019-01-31 00:17:23,311 : INFO : topic #14 (0.020): 0.025*\"walter\" + 0.022*\"forc\" + 0.021*\"armi\" + 0.021*\"aggress\" + 0.016*\"com\" + 0.016*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"oper\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:17:23,312 : INFO : topic #16 (0.020): 0.027*\"priest\" + 0.017*\"duke\" + 0.016*\"rotterdam\" + 0.015*\"quarterli\" + 0.013*\"margin\" + 0.011*\"king\" + 0.011*\"maria\" + 0.010*\"count\" + 0.010*\"princ\" + 0.010*\"order\"\n", + "2019-01-31 00:17:23,318 : INFO : topic diff=0.065059, rho=0.125988\n", + "2019-01-31 00:17:23,531 : INFO : PROGRESS: pass 0, at document #128000/4922894\n", + "2019-01-31 00:17:25,059 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:25,324 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.027*\"factor\" + 0.022*\"adulthood\" + 0.017*\"feel\" + 0.016*\"hostil\" + 0.015*\"male\" + 0.015*\"genu\" + 0.012*\"popolo\" + 0.012*\"live\" + 0.011*\"plaisir\"\n", + "2019-01-31 00:17:25,325 : INFO : topic #20 (0.020): 0.120*\"scholar\" + 0.034*\"struggl\" + 0.028*\"high\" + 0.027*\"educ\" + 0.016*\"yawn\" + 0.014*\"collector\" + 0.013*\"prognosi\" + 0.009*\"commun\" + 0.009*\"children\" + 0.008*\"class\"\n", + "2019-01-31 00:17:25,327 : INFO : topic #31 (0.020): 0.071*\"fusiform\" + 0.027*\"player\" + 0.021*\"place\" + 0.015*\"scientist\" + 0.013*\"taxpay\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.010*\"folei\" + 0.009*\"barber\" + 0.008*\"schmitz\"\n", + "2019-01-31 00:17:25,328 : INFO : topic #33 (0.020): 0.052*\"french\" + 0.048*\"franc\" + 0.027*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"focal\" + 0.013*\"lazi\" + 0.011*\"convei\" + 0.011*\"wine\"\n", + "2019-01-31 00:17:25,329 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.009*\"disco\" + 0.007*\"acid\" + 0.007*\"pathwai\" + 0.007*\"media\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"activ\"\n", + "2019-01-31 00:17:25,335 : INFO : topic diff=0.060318, rho=0.125000\n", + "2019-01-31 00:17:25,492 : INFO : PROGRESS: pass 0, at document #130000/4922894\n", + "2019-01-31 00:17:27,028 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:27,293 : INFO : topic #1 (0.020): 0.035*\"chilton\" + 0.034*\"hong\" + 0.034*\"kong\" + 0.026*\"china\" + 0.022*\"leah\" + 0.020*\"kim\" + 0.018*\"korean\" + 0.018*\"korea\" + 0.012*\"sourc\" + 0.012*\"han\"\n", + "2019-01-31 00:17:27,294 : INFO : topic #31 (0.020): 0.073*\"fusiform\" + 0.029*\"player\" + 0.022*\"place\" + 0.015*\"scientist\" + 0.013*\"taxpay\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.010*\"folei\" + 
0.009*\"barber\" + 0.008*\"schmitz\"\n", + "2019-01-31 00:17:27,295 : INFO : topic #37 (0.020): 0.007*\"love\" + 0.005*\"gestur\" + 0.004*\"night\" + 0.004*\"théori\" + 0.004*\"introductori\" + 0.004*\"blue\" + 0.004*\"litig\" + 0.004*\"place\" + 0.004*\"man\" + 0.004*\"misconcept\"\n", + "2019-01-31 00:17:27,296 : INFO : topic #16 (0.020): 0.028*\"priest\" + 0.017*\"quarterli\" + 0.016*\"duke\" + 0.016*\"rotterdam\" + 0.013*\"margin\" + 0.012*\"king\" + 0.012*\"princ\" + 0.011*\"maria\" + 0.011*\"grammat\" + 0.010*\"count\"\n", + "2019-01-31 00:17:27,298 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"taxpay\" + 0.017*\"tornado\" + 0.015*\"horac\" + 0.012*\"find\" + 0.012*\"candid\" + 0.011*\"squatter\" + 0.011*\"driver\" + 0.010*\"yawn\" + 0.010*\"théori\"\n", + "2019-01-31 00:17:27,304 : INFO : topic diff=0.059915, rho=0.124035\n", + "2019-01-31 00:17:27,457 : INFO : PROGRESS: pass 0, at document #132000/4922894\n", + "2019-01-31 00:17:28,978 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:29,243 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"walter\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.017*\"unionist\" + 0.016*\"com\" + 0.012*\"militari\" + 0.012*\"oper\" + 0.011*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:17:29,244 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"cytokin\" + 0.006*\"turn\"\n", + "2019-01-31 00:17:29,245 : INFO : topic #48 (0.020): 0.077*\"januari\" + 0.072*\"sens\" + 0.070*\"march\" + 0.070*\"octob\" + 0.067*\"august\" + 0.066*\"juli\" + 0.063*\"notion\" + 0.063*\"april\" + 0.060*\"judici\" + 0.060*\"decatur\"\n", + "2019-01-31 00:17:29,246 : INFO : topic #4 (0.020): 0.028*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"candid\" + 0.014*\"pour\" + 0.013*\"mode\" + 0.012*\"veget\" + 0.011*\"elabor\" + 0.009*\"spectacl\" + 
0.008*\"mandir\" + 0.007*\"produc\"\n", + "2019-01-31 00:17:29,248 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.020*\"taxpay\" + 0.017*\"tornado\" + 0.015*\"horac\" + 0.012*\"find\" + 0.011*\"candid\" + 0.011*\"squatter\" + 0.011*\"théori\" + 0.010*\"driver\" + 0.010*\"yawn\"\n", + "2019-01-31 00:17:29,254 : INFO : topic diff=0.057532, rho=0.123091\n", + "2019-01-31 00:17:29,408 : INFO : PROGRESS: pass 0, at document #134000/4922894\n", + "2019-01-31 00:17:30,890 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:31,156 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.020*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"lizard\" + 0.011*\"francisco\" + 0.010*\"latin\" + 0.010*\"carlo\"\n", + "2019-01-31 00:17:31,156 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.045*\"arsen\" + 0.039*\"line\" + 0.036*\"raid\" + 0.030*\"museo\" + 0.024*\"traceabl\" + 0.019*\"word\" + 0.018*\"pain\" + 0.018*\"artist\" + 0.016*\"exhaust\"\n", + "2019-01-31 00:17:31,158 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.025*\"democrat\" + 0.024*\"member\" + 0.016*\"republ\" + 0.016*\"polici\" + 0.015*\"seaport\" + 0.015*\"tendenc\" + 0.014*\"bypass\"\n", + "2019-01-31 00:17:31,159 : INFO : topic #32 (0.020): 0.067*\"district\" + 0.049*\"vigour\" + 0.043*\"popolo\" + 0.040*\"tortur\" + 0.033*\"area\" + 0.029*\"regim\" + 0.028*\"multitud\" + 0.024*\"cotton\" + 0.020*\"earthworm\" + 0.020*\"north\"\n", + "2019-01-31 00:17:31,160 : INFO : topic #8 (0.020): 0.031*\"law\" + 0.027*\"cortic\" + 0.027*\"act\" + 0.021*\"start\" + 0.014*\"case\" + 0.014*\"ricardo\" + 0.011*\"polaris\" + 0.010*\"legal\" + 0.009*\"unionist\" + 0.007*\"feder\"\n", + "2019-01-31 00:17:31,166 : INFO : topic diff=0.058482, rho=0.122169\n", + "2019-01-31 00:17:31,319 : INFO : PROGRESS: pass 0, at document #136000/4922894\n", + "2019-01-31 00:17:32,830 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:33,096 : INFO : topic #42 (0.020): 0.035*\"german\" + 0.024*\"germani\" + 0.015*\"greek\" + 0.011*\"vol\" + 0.011*\"der\" + 0.010*\"israel\" + 0.010*\"berlin\" + 0.010*\"jewish\" + 0.007*\"anglo\" + 0.007*\"europ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:17:33,097 : INFO : topic #37 (0.020): 0.007*\"love\" + 0.006*\"gestur\" + 0.005*\"night\" + 0.004*\"blue\" + 0.004*\"litig\" + 0.004*\"théori\" + 0.004*\"misconcept\" + 0.004*\"man\" + 0.004*\"place\" + 0.004*\"introductori\"\n", + "2019-01-31 00:17:33,098 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"southern\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"cytokin\" + 0.006*\"servitud\" + 0.006*\"differ\"\n", + "2019-01-31 00:17:33,099 : INFO : topic #44 (0.020): 0.036*\"rooftop\" + 0.026*\"final\" + 0.021*\"wife\" + 0.019*\"tourist\" + 0.016*\"ret\" + 0.014*\"chamber\" + 0.013*\"champion\" + 0.013*\"winner\" + 0.013*\"tiepolo\" + 0.011*\"taxpay\"\n", + "2019-01-31 00:17:33,100 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"record\" + 0.016*\"colder\" + 0.015*\"western\" + 0.014*\"acacia\" + 0.013*\"blind\" + 0.010*\"light\" + 0.008*\"green\" + 0.007*\"depress\" + 0.006*\"hand\"\n", + "2019-01-31 00:17:33,106 : INFO : topic diff=0.057041, rho=0.121268\n", + "2019-01-31 00:17:33,261 : INFO : PROGRESS: pass 0, at document #138000/4922894\n", + "2019-01-31 00:17:34,778 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:35,043 : INFO : topic #29 (0.020): 0.013*\"govern\" + 0.010*\"start\" + 0.010*\"replac\" + 0.008*\"countri\" + 0.007*\"yawn\" + 0.006*\"nation\" + 0.006*\"summerhil\" + 0.006*\"million\" + 0.006*\"new\" + 0.005*\"théori\"\n", + "2019-01-31 00:17:35,044 : INFO : topic #20 (0.020): 0.121*\"scholar\" + 0.034*\"struggl\" + 0.028*\"high\" + 0.027*\"educ\" + 
0.016*\"yawn\" + 0.015*\"collector\" + 0.013*\"prognosi\" + 0.009*\"commun\" + 0.008*\"class\" + 0.008*\"children\"\n", + "2019-01-31 00:17:35,045 : INFO : topic #19 (0.020): 0.009*\"form\" + 0.009*\"like\" + 0.008*\"origin\" + 0.008*\"woodcut\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.006*\"differ\" + 0.006*\"god\" + 0.006*\"pour\"\n", + "2019-01-31 00:17:35,047 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.026*\"taxpay\" + 0.025*\"crete\" + 0.023*\"scientist\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:17:35,048 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"record\" + 0.016*\"colder\" + 0.015*\"western\" + 0.013*\"acacia\" + 0.012*\"blind\" + 0.010*\"light\" + 0.008*\"green\" + 0.007*\"depress\" + 0.006*\"hand\"\n", + "2019-01-31 00:17:35,054 : INFO : topic diff=0.053944, rho=0.120386\n", + "2019-01-31 00:17:37,801 : INFO : -11.718 per-word bound, 3368.9 perplexity estimate based on a held-out corpus of 2000 documents with 535236 words\n", + "2019-01-31 00:17:37,801 : INFO : PROGRESS: pass 0, at document #140000/4922894\n", + "2019-01-31 00:17:39,284 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:39,549 : INFO : topic #7 (0.020): 0.019*\"snatch\" + 0.016*\"di\" + 0.016*\"factor\" + 0.014*\"bang\" + 0.012*\"yawn\" + 0.012*\"john\" + 0.011*\"margin\" + 0.011*\"will\" + 0.010*\"faster\" + 0.010*\"locri\"\n", + "2019-01-31 00:17:39,551 : INFO : topic #36 (0.020): 0.027*\"companhia\" + 0.010*\"serv\" + 0.009*\"develop\" + 0.009*\"bank\" + 0.009*\"market\" + 0.009*\"busi\" + 0.009*\"oper\" + 0.008*\"produc\" + 0.008*\"manag\" + 0.008*\"network\"\n", + "2019-01-31 00:17:39,552 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.033*\"turin\" + 0.026*\"china\" + 0.025*\"reprint\" + 0.025*\"sovereignti\" + 0.023*\"rural\" + 0.019*\"personifi\" + 0.017*\"poison\" + 0.016*\"unfortun\" + 
0.015*\"moscow\"\n", + "2019-01-31 00:17:39,554 : INFO : topic #38 (0.020): 0.018*\"walter\" + 0.016*\"king\" + 0.011*\"aza\" + 0.009*\"teufel\" + 0.008*\"battalion\" + 0.007*\"till\" + 0.007*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"embassi\"\n", + "2019-01-31 00:17:39,555 : INFO : topic #9 (0.020): 0.082*\"bone\" + 0.041*\"american\" + 0.020*\"valour\" + 0.015*\"dutch\" + 0.015*\"player\" + 0.014*\"folei\" + 0.013*\"polit\" + 0.013*\"english\" + 0.012*\"simpler\" + 0.010*\"surnam\"\n", + "2019-01-31 00:17:39,561 : INFO : topic diff=0.053215, rho=0.119523\n", + "2019-01-31 00:17:39,719 : INFO : PROGRESS: pass 0, at document #142000/4922894\n", + "2019-01-31 00:17:41,240 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:41,506 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.025*\"factor\" + 0.022*\"adulthood\" + 0.017*\"feel\" + 0.016*\"hostil\" + 0.016*\"male\" + 0.013*\"genu\" + 0.012*\"popolo\" + 0.012*\"live\" + 0.010*\"yawn\"\n", + "2019-01-31 00:17:41,507 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"kill\" + 0.006*\"later\" + 0.006*\"man\" + 0.005*\"deal\" + 0.005*\"sack\" + 0.005*\"retrospect\" + 0.004*\"fraud\" + 0.004*\"life\" + 0.004*\"dai\"\n", + "2019-01-31 00:17:41,509 : INFO : topic #26 (0.020): 0.034*\"workplac\" + 0.032*\"woman\" + 0.032*\"champion\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.025*\"medal\" + 0.023*\"event\" + 0.018*\"rainfal\" + 0.018*\"atheist\" + 0.017*\"théori\"\n", + "2019-01-31 00:17:41,509 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.015*\"unionist\" + 0.012*\"militari\" + 0.012*\"oper\" + 0.010*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 00:17:41,510 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.047*\"arsen\" + 0.041*\"line\" + 0.036*\"raid\" + 0.030*\"museo\" + 0.023*\"traceabl\" + 0.019*\"word\" + 0.019*\"artist\" + 0.018*\"pain\" + 0.016*\"serv\"\n", + "2019-01-31 
00:17:41,516 : INFO : topic diff=0.050616, rho=0.118678\n", + "2019-01-31 00:17:41,673 : INFO : PROGRESS: pass 0, at document #144000/4922894\n", + "2019-01-31 00:17:43,198 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:43,464 : INFO : topic #6 (0.020): 0.066*\"fewer\" + 0.027*\"septemb\" + 0.021*\"epiru\" + 0.017*\"teacher\" + 0.016*\"stake\" + 0.013*\"pop\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.010*\"direct\"\n", + "2019-01-31 00:17:43,466 : INFO : topic #46 (0.020): 0.022*\"damag\" + 0.018*\"stop\" + 0.018*\"wind\" + 0.015*\"treeless\" + 0.012*\"sweden\" + 0.012*\"norwai\" + 0.012*\"utc\" + 0.011*\"huntsvil\" + 0.011*\"swedish\" + 0.010*\"warmth\"\n", + "2019-01-31 00:17:43,467 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.006*\"gestur\" + 0.005*\"night\" + 0.004*\"litig\" + 0.004*\"blue\" + 0.004*\"man\" + 0.004*\"théori\" + 0.004*\"introductori\" + 0.004*\"misconcept\" + 0.003*\"bewild\"\n", + "2019-01-31 00:17:43,468 : INFO : topic #15 (0.020): 0.015*\"requir\" + 0.014*\"develop\" + 0.013*\"small\" + 0.011*\"word\" + 0.010*\"student\" + 0.009*\"human\" + 0.009*\"socialist\" + 0.008*\"commun\" + 0.008*\"cultur\" + 0.008*\"organ\"\n", + "2019-01-31 00:17:43,469 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.018*\"will\" + 0.014*\"jame\" + 0.012*\"georg\" + 0.012*\"rival\" + 0.011*\"david\" + 0.009*\"rhyme\" + 0.008*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"thirtieth\"\n", + "2019-01-31 00:17:43,475 : INFO : topic diff=0.053246, rho=0.117851\n", + "2019-01-31 00:17:43,634 : INFO : PROGRESS: pass 0, at document #146000/4922894\n", + "2019-01-31 00:17:45,169 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:45,434 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.026*\"taxpay\" + 0.025*\"crete\" + 0.023*\"scientist\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 
0.011*\"schmitz\"\n", + "2019-01-31 00:17:45,436 : INFO : topic #38 (0.020): 0.018*\"walter\" + 0.015*\"king\" + 0.013*\"aza\" + 0.011*\"teufel\" + 0.008*\"till\" + 0.008*\"battalion\" + 0.008*\"empath\" + 0.007*\"embassi\" + 0.007*\"armi\" + 0.007*\"forc\"\n", + "2019-01-31 00:17:45,437 : INFO : topic #28 (0.020): 0.027*\"hous\" + 0.026*\"build\" + 0.019*\"rivièr\" + 0.016*\"buford\" + 0.011*\"histor\" + 0.010*\"constitut\" + 0.010*\"hale\" + 0.010*\"briarwood\" + 0.010*\"rosenwald\" + 0.009*\"silicon\"\n", + "2019-01-31 00:17:45,437 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.047*\"arsen\" + 0.040*\"line\" + 0.034*\"raid\" + 0.031*\"museo\" + 0.022*\"traceabl\" + 0.019*\"word\" + 0.019*\"pain\" + 0.018*\"artist\" + 0.016*\"serv\"\n", + "2019-01-31 00:17:45,439 : INFO : topic #47 (0.020): 0.073*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"damn\" + 0.018*\"compos\" + 0.017*\"place\" + 0.014*\"jack\" + 0.014*\"orchestr\" + 0.014*\"theater\" + 0.013*\"physician\" + 0.013*\"olympo\"\n", + "2019-01-31 00:17:45,445 : INFO : topic diff=0.049351, rho=0.117041\n", + "2019-01-31 00:17:45,600 : INFO : PROGRESS: pass 0, at document #148000/4922894\n", + "2019-01-31 00:17:47,108 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:47,373 : INFO : topic #39 (0.020): 0.035*\"taxpay\" + 0.033*\"scientist\" + 0.026*\"canada\" + 0.024*\"clot\" + 0.021*\"canadian\" + 0.015*\"basketbal\" + 0.013*\"hoar\" + 0.013*\"confer\" + 0.011*\"toronto\" + 0.011*\"ontario\"\n", + "2019-01-31 00:17:47,374 : INFO : topic #46 (0.020): 0.021*\"damag\" + 0.018*\"stop\" + 0.017*\"wind\" + 0.014*\"treeless\" + 0.013*\"sweden\" + 0.013*\"norwai\" + 0.011*\"huntsvil\" + 0.011*\"swedish\" + 0.010*\"norwegian\" + 0.010*\"utc\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:17:47,376 : INFO : topic #15 (0.020): 0.015*\"requir\" + 0.013*\"develop\" + 0.012*\"small\" + 0.011*\"word\" + 0.010*\"student\" + 
0.010*\"human\" + 0.009*\"socialist\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"organ\"\n", + "2019-01-31 00:17:47,377 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.026*\"voluntari\" + 0.022*\"member\" + 0.022*\"democrat\" + 0.016*\"polici\" + 0.016*\"tendenc\" + 0.014*\"republ\" + 0.014*\"seaport\" + 0.014*\"bypass\"\n", + "2019-01-31 00:17:47,378 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.005*\"differ\" + 0.005*\"utopian\"\n", + "2019-01-31 00:17:47,384 : INFO : topic diff=0.051028, rho=0.116248\n", + "2019-01-31 00:17:47,541 : INFO : PROGRESS: pass 0, at document #150000/4922894\n", + "2019-01-31 00:17:49,060 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:49,326 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.026*\"factor\" + 0.023*\"adulthood\" + 0.018*\"hostil\" + 0.017*\"feel\" + 0.016*\"male\" + 0.013*\"genu\" + 0.012*\"live\" + 0.012*\"popolo\" + 0.010*\"yawn\"\n", + "2019-01-31 00:17:49,327 : INFO : topic #15 (0.020): 0.015*\"requir\" + 0.013*\"develop\" + 0.012*\"small\" + 0.010*\"word\" + 0.010*\"cultur\" + 0.010*\"student\" + 0.010*\"human\" + 0.009*\"socialist\" + 0.009*\"commun\" + 0.008*\"group\"\n", + "2019-01-31 00:17:49,328 : INFO : topic #8 (0.020): 0.030*\"law\" + 0.026*\"cortic\" + 0.022*\"act\" + 0.021*\"start\" + 0.015*\"ricardo\" + 0.015*\"case\" + 0.011*\"polaris\" + 0.010*\"legal\" + 0.009*\"unionist\" + 0.008*\"feder\"\n", + "2019-01-31 00:17:49,329 : INFO : topic #33 (0.020): 0.054*\"french\" + 0.045*\"franc\" + 0.028*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.017*\"focal\" + 0.015*\"lazi\" + 0.012*\"piec\" + 0.011*\"loui\"\n", + "2019-01-31 00:17:49,330 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.025*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 
0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:17:49,336 : INFO : topic diff=0.050762, rho=0.115470\n", + "2019-01-31 00:17:49,488 : INFO : PROGRESS: pass 0, at document #152000/4922894\n", + "2019-01-31 00:17:50,969 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:51,234 : INFO : topic #39 (0.020): 0.036*\"taxpay\" + 0.031*\"scientist\" + 0.026*\"canada\" + 0.024*\"clot\" + 0.022*\"canadian\" + 0.015*\"basketbal\" + 0.014*\"hoar\" + 0.012*\"confer\" + 0.011*\"ontario\" + 0.011*\"toronto\"\n", + "2019-01-31 00:17:51,235 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.040*\"cotton\" + 0.030*\"unionist\" + 0.018*\"american\" + 0.014*\"terri\" + 0.013*\"california\" + 0.013*\"north\" + 0.012*\"new\" + 0.012*\"toni\" + 0.011*\"violent\"\n", + "2019-01-31 00:17:51,237 : INFO : topic #45 (0.020): 0.018*\"black\" + 0.016*\"colder\" + 0.016*\"western\" + 0.014*\"record\" + 0.011*\"blind\" + 0.011*\"light\" + 0.008*\"green\" + 0.007*\"depress\" + 0.007*\"illicit\" + 0.007*\"hade\"\n", + "2019-01-31 00:17:51,238 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.046*\"arsen\" + 0.040*\"line\" + 0.033*\"raid\" + 0.030*\"museo\" + 0.021*\"traceabl\" + 0.020*\"pain\" + 0.019*\"word\" + 0.018*\"artist\" + 0.016*\"exhaust\"\n", + "2019-01-31 00:17:51,239 : INFO : topic #30 (0.020): 0.040*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.028*\"crete\" + 0.026*\"taxpay\" + 0.023*\"scientist\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:17:51,245 : INFO : topic diff=0.049907, rho=0.114708\n", + "2019-01-31 00:17:51,400 : INFO : PROGRESS: pass 0, at document #154000/4922894\n", + "2019-01-31 00:17:52,909 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:53,174 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.006*\"gestur\" + 0.005*\"night\" + 0.005*\"man\" + 0.004*\"christma\" + 
0.004*\"litig\" + 0.004*\"blue\" + 0.004*\"théori\" + 0.004*\"introductori\" + 0.004*\"place\"\n", + "2019-01-31 00:17:53,175 : INFO : topic #41 (0.020): 0.047*\"citi\" + 0.039*\"new\" + 0.023*\"palmer\" + 0.022*\"year\" + 0.019*\"center\" + 0.015*\"strategist\" + 0.010*\"open\" + 0.009*\"hot\" + 0.009*\"includ\" + 0.009*\"lobe\"\n", + "2019-01-31 00:17:53,176 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.006*\"later\" + 0.006*\"kill\" + 0.006*\"man\" + 0.005*\"sack\" + 0.005*\"deal\" + 0.005*\"retrospect\" + 0.004*\"dai\" + 0.004*\"fraud\" + 0.004*\"life\"\n", + "2019-01-31 00:17:53,177 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.040*\"cotton\" + 0.030*\"unionist\" + 0.018*\"american\" + 0.014*\"terri\" + 0.014*\"california\" + 0.012*\"north\" + 0.012*\"toni\" + 0.012*\"new\" + 0.011*\"violent\"\n", + "2019-01-31 00:17:53,179 : INFO : topic #46 (0.020): 0.019*\"damag\" + 0.018*\"stop\" + 0.016*\"wind\" + 0.014*\"sweden\" + 0.014*\"norwai\" + 0.013*\"swedish\" + 0.011*\"treeless\" + 0.011*\"danish\" + 0.011*\"norwegian\" + 0.010*\"denmark\"\n", + "2019-01-31 00:17:53,185 : INFO : topic diff=0.046475, rho=0.113961\n", + "2019-01-31 00:17:53,338 : INFO : PROGRESS: pass 0, at document #156000/4922894\n", + "2019-01-31 00:17:54,834 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:55,100 : INFO : topic #20 (0.020): 0.123*\"scholar\" + 0.034*\"struggl\" + 0.030*\"high\" + 0.028*\"educ\" + 0.017*\"yawn\" + 0.014*\"collector\" + 0.012*\"prognosi\" + 0.009*\"commun\" + 0.008*\"task\" + 0.008*\"children\"\n", + "2019-01-31 00:17:55,101 : INFO : topic #2 (0.020): 0.044*\"isl\" + 0.041*\"shield\" + 0.020*\"narrat\" + 0.015*\"pope\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.010*\"coalit\" + 0.010*\"crew\" + 0.010*\"class\"\n", + "2019-01-31 00:17:55,103 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.028*\"factor\" + 0.023*\"adulthood\" + 0.018*\"hostil\" + 0.017*\"feel\" + 0.015*\"male\" + 
0.012*\"genu\" + 0.012*\"popolo\" + 0.012*\"live\" + 0.010*\"yawn\"\n", + "2019-01-31 00:17:55,104 : INFO : topic #45 (0.020): 0.018*\"black\" + 0.017*\"colder\" + 0.016*\"record\" + 0.016*\"western\" + 0.011*\"blind\" + 0.010*\"light\" + 0.008*\"green\" + 0.007*\"depress\" + 0.007*\"illicit\" + 0.006*\"hand\"\n", + "2019-01-31 00:17:55,105 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.031*\"publicis\" + 0.020*\"word\" + 0.014*\"new\" + 0.014*\"edit\" + 0.012*\"worldwid\" + 0.011*\"storag\" + 0.011*\"presid\" + 0.011*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:17:55,111 : INFO : topic diff=0.046562, rho=0.113228\n", + "2019-01-31 00:17:55,323 : INFO : PROGRESS: pass 0, at document #158000/4922894\n", + "2019-01-31 00:17:56,815 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:17:57,081 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.024*\"final\" + 0.022*\"wife\" + 0.018*\"tourist\" + 0.014*\"tiepolo\" + 0.013*\"taxpay\" + 0.013*\"champion\" + 0.013*\"chamber\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 00:17:57,082 : INFO : topic #11 (0.020): 0.030*\"john\" + 0.018*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"slur\" + 0.009*\"rhyme\" + 0.008*\"thirtieth\" + 0.008*\"mexican–american\"\n", + "2019-01-31 00:17:57,084 : INFO : topic #26 (0.020): 0.035*\"workplac\" + 0.034*\"champion\" + 0.032*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.022*\"event\" + 0.017*\"atheist\" + 0.017*\"théori\" + 0.017*\"taxpay\"\n", + "2019-01-31 00:17:57,085 : INFO : topic #36 (0.020): 0.027*\"companhia\" + 0.010*\"serv\" + 0.009*\"develop\" + 0.009*\"oper\" + 0.009*\"network\" + 0.009*\"manag\" + 0.009*\"market\" + 0.009*\"busi\" + 0.008*\"produc\" + 0.008*\"prognosi\"\n", + "2019-01-31 00:17:57,086 : INFO : topic #39 (0.020): 0.035*\"taxpay\" + 0.031*\"scientist\" + 0.028*\"canada\" + 0.023*\"canadian\" + 0.022*\"clot\" + 0.014*\"basketbal\" + 
0.013*\"hoar\" + 0.013*\"ontario\" + 0.012*\"confer\" + 0.011*\"head\"\n", + "2019-01-31 00:17:57,092 : INFO : topic diff=0.047035, rho=0.112509\n", + "2019-01-31 00:17:59,843 : INFO : -11.752 per-word bound, 3448.6 perplexity estimate based on a held-out corpus of 2000 documents with 534019 words\n", + "2019-01-31 00:17:59,843 : INFO : PROGRESS: pass 0, at document #160000/4922894\n", + "2019-01-31 00:18:01,318 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:01,583 : INFO : topic #11 (0.020): 0.030*\"john\" + 0.018*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"slur\" + 0.009*\"rhyme\" + 0.008*\"thirtieth\" + 0.008*\"mexican–american\"\n", + "2019-01-31 00:18:01,584 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.025*\"sourc\" + 0.024*\"london\" + 0.022*\"australian\" + 0.020*\"england\" + 0.020*\"ireland\" + 0.018*\"new\" + 0.016*\"wale\" + 0.015*\"youth\" + 0.013*\"north\"\n", + "2019-01-31 00:18:01,585 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"turn\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"uruguayan\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"southern\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:18:01,586 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.020*\"del\" + 0.019*\"soviet\" + 0.017*\"mexico\" + 0.012*\"juan\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"josé\" + 0.010*\"carlo\"\n", + "2019-01-31 00:18:01,587 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.043*\"franc\" + 0.033*\"jean\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.017*\"daphn\" + 0.016*\"piec\" + 0.014*\"focal\" + 0.013*\"lazi\" + 0.012*\"loui\"\n", + "2019-01-31 00:18:01,593 : INFO : topic diff=0.045646, rho=0.111803\n", + "2019-01-31 00:18:01,749 : INFO : PROGRESS: pass 0, at document #162000/4922894\n", + "2019-01-31 00:18:03,246 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:03,511 : INFO : topic #28 (0.020): 0.027*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.016*\"buford\" + 0.011*\"rosenwald\" + 0.011*\"histor\" + 0.010*\"constitut\" + 0.009*\"silicon\" + 0.009*\"briarwood\" + 0.009*\"lobe\"\n", + "2019-01-31 00:18:03,513 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.040*\"american\" + 0.025*\"valour\" + 0.018*\"folei\" + 0.017*\"dutch\" + 0.016*\"player\" + 0.014*\"polit\" + 0.013*\"english\" + 0.010*\"simpler\" + 0.009*\"surnam\"\n", + "2019-01-31 00:18:03,514 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.024*\"final\" + 0.023*\"wife\" + 0.019*\"tourist\" + 0.015*\"champion\" + 0.015*\"open\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"winner\" + 0.013*\"taxpay\"\n", + "2019-01-31 00:18:03,515 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"turn\" + 0.006*\"gener\" + 0.006*\"uruguayan\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"utopian\"\n", + "2019-01-31 00:18:03,517 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.016*\"lagrang\" + 0.015*\"warmth\" + 0.014*\"area\" + 0.014*\"mount\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"palmer\" + 0.007*\"near\" + 0.007*\"firm\"\n", + "2019-01-31 00:18:03,522 : INFO : topic diff=0.043966, rho=0.111111\n", + "2019-01-31 00:18:03,673 : INFO : PROGRESS: pass 0, at document #164000/4922894\n", + "2019-01-31 00:18:05,155 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:05,421 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.039*\"american\" + 0.026*\"valour\" + 0.017*\"folei\" + 0.017*\"dutch\" + 0.015*\"player\" + 0.014*\"polit\" + 0.013*\"english\" + 0.010*\"simpler\" + 0.009*\"acrimoni\"\n", + "2019-01-31 00:18:05,423 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.026*\"crete\" + 0.025*\"taxpay\" + 0.022*\"scientist\" + 
0.021*\"folei\" + 0.016*\"martin\" + 0.016*\"goal\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:18:05,424 : INFO : topic #1 (0.020): 0.055*\"chilton\" + 0.045*\"china\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.023*\"korea\" + 0.019*\"korean\" + 0.018*\"kim\" + 0.017*\"leah\" + 0.013*\"sourc\" + 0.012*\"min\"\n", + "2019-01-31 00:18:05,425 : INFO : topic #2 (0.020): 0.048*\"shield\" + 0.041*\"isl\" + 0.025*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.014*\"capshaw\" + 0.010*\"nativist\" + 0.010*\"blur\" + 0.010*\"bahá\" + 0.009*\"coalit\"\n", + "2019-01-31 00:18:05,427 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.066*\"best\" + 0.033*\"jacksonvil\" + 0.032*\"yawn\" + 0.025*\"japanes\" + 0.022*\"noll\" + 0.020*\"women\" + 0.019*\"festiv\" + 0.015*\"prison\" + 0.013*\"winner\"\n", + "2019-01-31 00:18:05,432 : INFO : topic diff=0.040320, rho=0.110432\n", + "2019-01-31 00:18:05,590 : INFO : PROGRESS: pass 0, at document #166000/4922894\n", + "2019-01-31 00:18:07,107 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:07,372 : INFO : topic #36 (0.020): 0.028*\"companhia\" + 0.010*\"serv\" + 0.009*\"develop\" + 0.009*\"network\" + 0.009*\"busi\" + 0.009*\"manag\" + 0.009*\"oper\" + 0.009*\"market\" + 0.008*\"produc\" + 0.007*\"prognosi\"\n", + "2019-01-31 00:18:07,373 : INFO : topic #16 (0.020): 0.028*\"priest\" + 0.019*\"quarterli\" + 0.017*\"duke\" + 0.015*\"rotterdam\" + 0.015*\"king\" + 0.012*\"princ\" + 0.012*\"maria\" + 0.012*\"grammat\" + 0.010*\"count\" + 0.009*\"portugues\"\n", + "2019-01-31 00:18:07,375 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"colder\" + 0.015*\"western\" + 0.015*\"record\" + 0.013*\"blind\" + 0.009*\"light\" + 0.007*\"green\" + 0.007*\"depress\" + 0.007*\"illicit\" + 0.006*\"hand\"\n", + "2019-01-31 00:18:07,376 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"televis\" + 0.009*\"start\" + 0.009*\"khalsa\" + 0.008*\"islam\" + 
0.008*\"sri\" + 0.008*\"singh\" + 0.008*\"muskoge\"\n", + "2019-01-31 00:18:07,377 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.039*\"american\" + 0.025*\"valour\" + 0.017*\"folei\" + 0.016*\"dutch\" + 0.015*\"player\" + 0.014*\"polit\" + 0.013*\"english\" + 0.010*\"simpler\" + 0.009*\"surnam\"\n", + "2019-01-31 00:18:07,383 : INFO : topic diff=0.042581, rho=0.109764\n", + "2019-01-31 00:18:07,534 : INFO : PROGRESS: pass 0, at document #168000/4922894\n", + "2019-01-31 00:18:08,996 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:09,261 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.065*\"best\" + 0.035*\"jacksonvil\" + 0.031*\"yawn\" + 0.028*\"japanes\" + 0.022*\"noll\" + 0.020*\"women\" + 0.020*\"festiv\" + 0.014*\"prison\" + 0.013*\"intern\"\n", + "2019-01-31 00:18:09,262 : INFO : topic #20 (0.020): 0.128*\"scholar\" + 0.033*\"struggl\" + 0.028*\"high\" + 0.028*\"educ\" + 0.018*\"yawn\" + 0.012*\"collector\" + 0.012*\"prognosi\" + 0.012*\"district\" + 0.009*\"task\" + 0.009*\"electron\"\n", + "2019-01-31 00:18:09,264 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.033*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.010*\"start\" + 0.009*\"islam\" + 0.008*\"khalsa\" + 0.008*\"singh\" + 0.008*\"sri\" + 0.008*\"tajikistan\"\n", + "2019-01-31 00:18:09,265 : INFO : topic #42 (0.020): 0.037*\"german\" + 0.022*\"germani\" + 0.012*\"jewish\" + 0.012*\"der\" + 0.011*\"vol\" + 0.010*\"greek\" + 0.010*\"israel\" + 0.010*\"berlin\" + 0.008*\"anglo\" + 0.007*\"und\"\n", + "2019-01-31 00:18:09,266 : INFO : topic #39 (0.020): 0.034*\"taxpay\" + 0.029*\"scientist\" + 0.027*\"canada\" + 0.024*\"canadian\" + 0.022*\"clot\" + 0.015*\"basketbal\" + 0.013*\"hoar\" + 0.012*\"toronto\" + 0.012*\"confer\" + 0.012*\"ontario\"\n", + "2019-01-31 00:18:09,272 : INFO : topic diff=0.041998, rho=0.109109\n", + "2019-01-31 00:18:09,424 : INFO : PROGRESS: pass 0, at document #170000/4922894\n", + "2019-01-31 00:18:10,902 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:11,168 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.020*\"del\" + 0.019*\"mexico\" + 0.016*\"soviet\" + 0.014*\"santa\" + 0.012*\"juan\" + 0.011*\"josé\" + 0.011*\"antiqu\" + 0.010*\"francisco\"\n", + "2019-01-31 00:18:11,169 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.017*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"slur\" + 0.009*\"rhyme\" + 0.008*\"thirtieth\" + 0.008*\"mexican–american\"\n", + "2019-01-31 00:18:11,170 : INFO : topic #20 (0.020): 0.127*\"scholar\" + 0.032*\"struggl\" + 0.028*\"high\" + 0.028*\"educ\" + 0.018*\"yawn\" + 0.012*\"collector\" + 0.012*\"prognosi\" + 0.012*\"district\" + 0.009*\"task\" + 0.009*\"electron\"\n", + "2019-01-31 00:18:11,171 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.007*\"disco\" + 0.007*\"pathwai\" + 0.006*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"activ\" + 0.006*\"proper\" + 0.005*\"acid\"\n", + "2019-01-31 00:18:11,172 : INFO : topic #0 (0.020): 0.071*\"statewid\" + 0.046*\"arsen\" + 0.037*\"line\" + 0.032*\"raid\" + 0.032*\"museo\" + 0.021*\"traceabl\" + 0.020*\"pain\" + 0.019*\"word\" + 0.017*\"artist\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:18:11,178 : INFO : topic diff=0.041250, rho=0.108465\n", + "2019-01-31 00:18:11,335 : INFO : PROGRESS: pass 0, at document #172000/4922894\n", + "2019-01-31 00:18:12,834 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:13,100 : INFO : topic #19 (0.020): 0.009*\"like\" + 0.009*\"origin\" + 0.008*\"form\" + 0.008*\"woodcut\" + 0.007*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.007*\"differ\" + 0.006*\"dynam\" + 0.005*\"anim\"\n", + "2019-01-31 00:18:13,101 : INFO : topic #4 (0.020): 0.026*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.013*\"candid\" + 0.011*\"mode\" + 0.010*\"elabor\" + 0.010*\"veget\" + 
0.008*\"spectacl\" + 0.008*\"produc\" + 0.007*\"turn\"\n", + "2019-01-31 00:18:13,102 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"southern\" + 0.007*\"frontal\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"cytokin\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"gener\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:18:13,102 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.025*\"cortic\" + 0.021*\"start\" + 0.020*\"act\" + 0.017*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"unionist\" + 0.008*\"feder\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:18:13,103 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.039*\"new\" + 0.024*\"palmer\" + 0.022*\"year\" + 0.017*\"center\" + 0.016*\"strategist\" + 0.010*\"open\" + 0.009*\"hot\" + 0.009*\"includ\" + 0.008*\"lobe\"\n", + "2019-01-31 00:18:13,109 : INFO : topic diff=0.041530, rho=0.107833\n", + "2019-01-31 00:18:13,264 : INFO : PROGRESS: pass 0, at document #174000/4922894\n", + "2019-01-31 00:18:14,756 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:15,021 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.043*\"shield\" + 0.022*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.011*\"capshaw\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"blur\" + 0.009*\"bahá\"\n", + "2019-01-31 00:18:15,022 : INFO : topic #14 (0.020): 0.023*\"walter\" + 0.022*\"forc\" + 0.020*\"aggress\" + 0.019*\"armi\" + 0.017*\"com\" + 0.015*\"unionist\" + 0.012*\"militari\" + 0.012*\"refut\" + 0.012*\"oper\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:18:15,023 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.039*\"new\" + 0.024*\"palmer\" + 0.021*\"year\" + 0.017*\"strategist\" + 0.017*\"center\" + 0.011*\"open\" + 0.009*\"includ\" + 0.009*\"hot\" + 0.008*\"lobe\"\n", + "2019-01-31 00:18:15,025 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.040*\"american\" + 0.026*\"valour\" + 0.017*\"dutch\" + 0.017*\"folei\" + 
0.017*\"player\" + 0.015*\"polit\" + 0.015*\"english\" + 0.010*\"simpler\" + 0.010*\"surnam\"\n", + "2019-01-31 00:18:15,026 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.015*\"lagrang\" + 0.015*\"warmth\" + 0.015*\"mount\" + 0.015*\"area\" + 0.008*\"north\" + 0.008*\"foam\" + 0.007*\"palmer\" + 0.007*\"land\" + 0.007*\"lobe\"\n", + "2019-01-31 00:18:15,032 : INFO : topic diff=0.037128, rho=0.107211\n", + "2019-01-31 00:18:15,183 : INFO : PROGRESS: pass 0, at document #176000/4922894\n", + "2019-01-31 00:18:16,676 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:16,941 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"damn\" + 0.019*\"compos\" + 0.017*\"place\" + 0.016*\"theater\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.013*\"word\" + 0.013*\"jack\"\n", + "2019-01-31 00:18:16,943 : INFO : topic #46 (0.020): 0.021*\"wind\" + 0.018*\"damag\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.014*\"sweden\" + 0.011*\"swedish\" + 0.011*\"turkish\" + 0.011*\"treeless\" + 0.011*\"norwegian\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:18:16,944 : INFO : topic #48 (0.020): 0.081*\"august\" + 0.076*\"januari\" + 0.076*\"octob\" + 0.075*\"march\" + 0.074*\"juli\" + 0.073*\"sens\" + 0.069*\"judici\" + 0.069*\"notion\" + 0.068*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 00:18:16,945 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.022*\"start\" + 0.019*\"act\" + 0.017*\"ricardo\" + 0.013*\"case\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.009*\"unionist\" + 0.008*\"justic\"\n", + "2019-01-31 00:18:16,946 : INFO : topic #29 (0.020): 0.013*\"govern\" + 0.011*\"start\" + 0.009*\"replac\" + 0.008*\"countri\" + 0.007*\"yawn\" + 0.006*\"nation\" + 0.006*\"summerhil\" + 0.006*\"million\" + 0.006*\"new\" + 0.005*\"théori\"\n", + "2019-01-31 00:18:16,952 : INFO : topic diff=0.039723, rho=0.106600\n", + "2019-01-31 00:18:17,108 : INFO : PROGRESS: pass 0, at document #178000/4922894\n", + 
"2019-01-31 00:18:18,617 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:18,883 : INFO : topic #43 (0.020): 0.069*\"elect\" + 0.057*\"parti\" + 0.025*\"voluntari\" + 0.023*\"member\" + 0.022*\"democrat\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 00:18:18,884 : INFO : topic #45 (0.020): 0.018*\"black\" + 0.016*\"western\" + 0.015*\"colder\" + 0.014*\"record\" + 0.012*\"blind\" + 0.009*\"light\" + 0.008*\"green\" + 0.007*\"illicit\" + 0.006*\"color\" + 0.006*\"arm\"\n", + "2019-01-31 00:18:18,885 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.013*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"rhyme\" + 0.008*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"thirtieth\"\n", + "2019-01-31 00:18:18,886 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.013*\"deal\" + 0.013*\"margin\" + 0.013*\"faster\" + 0.011*\"john\" + 0.011*\"daughter\" + 0.011*\"bone\"\n", + "2019-01-31 00:18:18,887 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.039*\"new\" + 0.024*\"palmer\" + 0.021*\"year\" + 0.017*\"strategist\" + 0.016*\"center\" + 0.011*\"open\" + 0.009*\"hot\" + 0.009*\"includ\" + 0.008*\"lobe\"\n", + "2019-01-31 00:18:18,893 : INFO : topic diff=0.036481, rho=0.106000\n", + "2019-01-31 00:18:21,674 : INFO : -11.775 per-word bound, 3505.3 perplexity estimate based on a held-out corpus of 2000 documents with 552825 words\n", + "2019-01-31 00:18:21,675 : INFO : PROGRESS: pass 0, at document #180000/4922894\n", + "2019-01-31 00:18:23,155 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:23,420 : INFO : topic #33 (0.020): 0.053*\"french\" + 0.041*\"franc\" + 0.028*\"pari\" + 0.027*\"jean\" + 0.021*\"sail\" + 0.020*\"daphn\" + 0.015*\"piec\" + 0.014*\"lazi\" + 0.012*\"focal\" + 0.011*\"loui\"\n", + "2019-01-31 
00:18:23,422 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"tornado\" + 0.013*\"candid\" + 0.012*\"driver\" + 0.011*\"horac\" + 0.011*\"find\" + 0.011*\"yawn\" + 0.011*\"squatter\" + 0.011*\"champion\"\n", + "2019-01-31 00:18:23,423 : INFO : topic #40 (0.020): 0.080*\"unit\" + 0.029*\"collector\" + 0.018*\"institut\" + 0.016*\"schuster\" + 0.014*\"professor\" + 0.014*\"student\" + 0.012*\"governor\" + 0.012*\"american\" + 0.012*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 00:18:23,424 : INFO : topic #19 (0.020): 0.009*\"like\" + 0.009*\"origin\" + 0.008*\"form\" + 0.008*\"woodcut\" + 0.007*\"mean\" + 0.007*\"charact\" + 0.007*\"uruguayan\" + 0.007*\"differ\" + 0.006*\"dynam\" + 0.006*\"god\"\n", + "2019-01-31 00:18:23,425 : INFO : topic #39 (0.020): 0.033*\"taxpay\" + 0.029*\"scientist\" + 0.026*\"canada\" + 0.024*\"canadian\" + 0.021*\"clot\" + 0.015*\"basketbal\" + 0.014*\"toronto\" + 0.012*\"hoar\" + 0.012*\"ontario\" + 0.011*\"confer\"\n", + "2019-01-31 00:18:23,431 : INFO : topic diff=0.035389, rho=0.105409\n", + "2019-01-31 00:18:23,587 : INFO : PROGRESS: pass 0, at document #182000/4922894\n", + "2019-01-31 00:18:25,087 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:25,352 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.015*\"area\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"palmer\" + 0.007*\"land\" + 0.007*\"vacant\"\n", + "2019-01-31 00:18:25,354 : INFO : topic #32 (0.020): 0.068*\"district\" + 0.051*\"vigour\" + 0.045*\"popolo\" + 0.040*\"tortur\" + 0.030*\"area\" + 0.030*\"regim\" + 0.028*\"multitud\" + 0.027*\"cotton\" + 0.020*\"commun\" + 0.020*\"prosper\"\n", + "2019-01-31 00:18:25,355 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.042*\"cotton\" + 0.028*\"unionist\" + 0.019*\"american\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"new\" + 0.012*\"north\" + 0.011*\"violent\" + 0.010*\"obes\"\n", + 
"2019-01-31 00:18:25,356 : INFO : topic #20 (0.020): 0.129*\"scholar\" + 0.034*\"struggl\" + 0.029*\"high\" + 0.028*\"educ\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.012*\"collector\" + 0.011*\"district\" + 0.009*\"task\" + 0.008*\"gothic\"\n", + "2019-01-31 00:18:25,358 : INFO : topic #17 (0.020): 0.062*\"church\" + 0.021*\"fifteenth\" + 0.020*\"jpg\" + 0.019*\"cathol\" + 0.017*\"christian\" + 0.017*\"centuri\" + 0.016*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.013*\"italian\"\n", + "2019-01-31 00:18:25,363 : INFO : topic diff=0.037979, rho=0.104828\n", + "2019-01-31 00:18:25,518 : INFO : PROGRESS: pass 0, at document #184000/4922894\n", + "2019-01-31 00:18:26,995 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:27,260 : INFO : topic #13 (0.020): 0.032*\"australia\" + 0.026*\"sourc\" + 0.024*\"australian\" + 0.023*\"london\" + 0.022*\"england\" + 0.021*\"ireland\" + 0.020*\"new\" + 0.016*\"youth\" + 0.014*\"wale\" + 0.014*\"british\"\n", + "2019-01-31 00:18:27,261 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.014*\"jame\" + 0.013*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"rhyme\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.007*\"paul\"\n", + "2019-01-31 00:18:27,262 : INFO : topic #36 (0.020): 0.027*\"companhia\" + 0.009*\"serv\" + 0.009*\"prognosi\" + 0.009*\"develop\" + 0.009*\"oper\" + 0.009*\"manag\" + 0.009*\"market\" + 0.009*\"busi\" + 0.008*\"produc\" + 0.008*\"network\"\n", + "2019-01-31 00:18:27,263 : INFO : topic #16 (0.020): 0.026*\"priest\" + 0.019*\"king\" + 0.017*\"quarterli\" + 0.016*\"duke\" + 0.016*\"maria\" + 0.014*\"klux\" + 0.014*\"rotterdam\" + 0.012*\"grammat\" + 0.012*\"princ\" + 0.010*\"count\"\n", + "2019-01-31 00:18:27,264 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.015*\"area\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.007*\"palmer\" + 0.007*\"vacant\"\n" + ] + }, 
+ { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:18:27,270 : INFO : topic diff=0.036239, rho=0.104257\n", + "2019-01-31 00:18:27,428 : INFO : PROGRESS: pass 0, at document #186000/4922894\n", + "2019-01-31 00:18:28,957 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:29,223 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"taxpay\" + 0.015*\"tornado\" + 0.015*\"candid\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"horac\" + 0.011*\"squatter\" + 0.010*\"yawn\"\n", + "2019-01-31 00:18:29,224 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"march\" + 0.078*\"august\" + 0.077*\"octob\" + 0.074*\"juli\" + 0.074*\"januari\" + 0.069*\"judici\" + 0.069*\"notion\" + 0.068*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 00:18:29,225 : INFO : topic #13 (0.020): 0.031*\"australia\" + 0.025*\"sourc\" + 0.023*\"australian\" + 0.022*\"london\" + 0.021*\"england\" + 0.020*\"ireland\" + 0.020*\"new\" + 0.018*\"youth\" + 0.016*\"british\" + 0.014*\"wale\"\n", + "2019-01-31 00:18:29,226 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.032*\"offic\" + 0.025*\"seri\" + 0.024*\"minist\" + 0.018*\"gener\" + 0.017*\"serv\" + 0.016*\"chickasaw\" + 0.016*\"member\" + 0.014*\"appeas\" + 0.013*\"secess\"\n", + "2019-01-31 00:18:29,227 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.047*\"arsen\" + 0.035*\"raid\" + 0.033*\"line\" + 0.033*\"museo\" + 0.020*\"word\" + 0.020*\"pain\" + 0.019*\"traceabl\" + 0.019*\"artist\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:18:29,233 : INFO : topic diff=0.037878, rho=0.103695\n", + "2019-01-31 00:18:29,383 : INFO : PROGRESS: pass 0, at document #188000/4922894\n", + "2019-01-31 00:18:30,849 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:31,114 : INFO : topic #1 (0.020): 0.059*\"chilton\" + 0.048*\"china\" + 0.027*\"hong\" + 0.027*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 
0.017*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.010*\"summer\"\n", + "2019-01-31 00:18:31,115 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.039*\"new\" + 0.026*\"palmer\" + 0.022*\"year\" + 0.016*\"center\" + 0.015*\"strategist\" + 0.010*\"open\" + 0.009*\"includ\" + 0.009*\"hot\" + 0.008*\"lobe\"\n", + "2019-01-31 00:18:31,117 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"crete\" + 0.022*\"scientist\" + 0.021*\"folei\" + 0.017*\"martin\" + 0.016*\"goal\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:18:31,118 : INFO : topic #32 (0.020): 0.064*\"district\" + 0.050*\"vigour\" + 0.047*\"tortur\" + 0.046*\"popolo\" + 0.030*\"regim\" + 0.029*\"area\" + 0.027*\"multitud\" + 0.026*\"cotton\" + 0.021*\"prosper\" + 0.020*\"commun\"\n", + "2019-01-31 00:18:31,119 : INFO : topic #39 (0.020): 0.031*\"taxpay\" + 0.029*\"scientist\" + 0.026*\"canada\" + 0.024*\"canadian\" + 0.023*\"clot\" + 0.015*\"basketbal\" + 0.014*\"toronto\" + 0.012*\"ontario\" + 0.012*\"confer\" + 0.012*\"hoar\"\n", + "2019-01-31 00:18:31,125 : INFO : topic diff=0.035583, rho=0.103142\n", + "2019-01-31 00:18:31,329 : INFO : PROGRESS: pass 0, at document #190000/4922894\n", + "2019-01-31 00:18:32,817 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:33,083 : INFO : topic #46 (0.020): 0.020*\"damag\" + 0.018*\"wind\" + 0.016*\"norwai\" + 0.015*\"sweden\" + 0.014*\"stop\" + 0.014*\"swedish\" + 0.012*\"turkei\" + 0.012*\"earthquak\" + 0.012*\"turkish\" + 0.011*\"norwegian\"\n", + "2019-01-31 00:18:33,084 : INFO : topic #15 (0.020): 0.014*\"requir\" + 0.013*\"develop\" + 0.012*\"small\" + 0.010*\"cultur\" + 0.010*\"word\" + 0.009*\"organ\" + 0.009*\"student\" + 0.008*\"socialist\" + 0.008*\"commun\" + 0.008*\"human\"\n", + "2019-01-31 00:18:33,085 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.032*\"offic\" + 0.025*\"seri\" + 0.025*\"minist\" + 0.018*\"gener\" + 0.016*\"serv\" + 
0.016*\"chickasaw\" + 0.016*\"member\" + 0.014*\"appeas\" + 0.013*\"secess\"\n", + "2019-01-31 00:18:33,086 : INFO : topic #16 (0.020): 0.029*\"priest\" + 0.020*\"king\" + 0.018*\"quarterli\" + 0.018*\"duke\" + 0.016*\"klux\" + 0.014*\"maria\" + 0.014*\"rotterdam\" + 0.013*\"princ\" + 0.013*\"portugues\" + 0.012*\"grammat\"\n", + "2019-01-31 00:18:33,088 : INFO : topic #20 (0.020): 0.126*\"scholar\" + 0.036*\"struggl\" + 0.029*\"educ\" + 0.028*\"high\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.012*\"collector\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.008*\"task\"\n", + "2019-01-31 00:18:33,094 : INFO : topic diff=0.035430, rho=0.102598\n", + "2019-01-31 00:18:33,255 : INFO : PROGRESS: pass 0, at document #192000/4922894\n", + "2019-01-31 00:18:34,776 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:35,041 : INFO : topic #32 (0.020): 0.064*\"district\" + 0.050*\"vigour\" + 0.046*\"tortur\" + 0.045*\"popolo\" + 0.030*\"regim\" + 0.029*\"area\" + 0.027*\"multitud\" + 0.025*\"cotton\" + 0.022*\"prosper\" + 0.021*\"commun\"\n", + "2019-01-31 00:18:35,042 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"southern\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"gener\" + 0.005*\"cytokin\" + 0.005*\"uruguayan\"\n", + "2019-01-31 00:18:35,044 : INFO : topic #46 (0.020): 0.020*\"damag\" + 0.017*\"wind\" + 0.015*\"norwai\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.014*\"stop\" + 0.012*\"turkish\" + 0.012*\"turkei\" + 0.012*\"earthquak\" + 0.011*\"norwegian\"\n", + "2019-01-31 00:18:35,045 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.010*\"slur\" + 0.009*\"rhyme\" + 0.008*\"mexican–american\" + 0.007*\"thirtieth\"\n", + "2019-01-31 00:18:35,046 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.039*\"new\" + 0.025*\"palmer\" + 0.022*\"year\" + 0.016*\"center\" + 
0.015*\"strategist\" + 0.010*\"open\" + 0.009*\"includ\" + 0.008*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:18:35,051 : INFO : topic diff=0.039348, rho=0.102062\n", + "2019-01-31 00:18:35,207 : INFO : PROGRESS: pass 0, at document #194000/4922894\n", + "2019-01-31 00:18:36,705 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:36,971 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.031*\"champion\" + 0.030*\"woman\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.023*\"event\" + 0.021*\"alic\" + 0.020*\"medal\" + 0.017*\"atheist\" + 0.017*\"théori\"\n", + "2019-01-31 00:18:36,972 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.038*\"american\" + 0.031*\"valour\" + 0.017*\"dutch\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"polit\" + 0.014*\"english\" + 0.010*\"surnam\" + 0.010*\"simpler\"\n", + "2019-01-31 00:18:36,973 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.031*\"offic\" + 0.025*\"seri\" + 0.024*\"minist\" + 0.018*\"gener\" + 0.016*\"chickasaw\" + 0.016*\"serv\" + 0.016*\"member\" + 0.015*\"appeas\" + 0.012*\"secess\"\n", + "2019-01-31 00:18:36,974 : INFO : topic #35 (0.020): 0.046*\"russia\" + 0.033*\"sovereignti\" + 0.030*\"rural\" + 0.026*\"reprint\" + 0.023*\"personifi\" + 0.019*\"unfortun\" + 0.018*\"moscow\" + 0.016*\"poison\" + 0.014*\"intern\" + 0.013*\"shirin\"\n", + "2019-01-31 00:18:36,975 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.039*\"new\" + 0.025*\"palmer\" + 0.022*\"year\" + 0.015*\"center\" + 0.015*\"strategist\" + 0.010*\"open\" + 0.009*\"includ\" + 0.008*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:18:36,981 : INFO : topic diff=0.031677, rho=0.101535\n", + "2019-01-31 00:18:37,134 : INFO : PROGRESS: pass 0, at document #196000/4922894\n", + "2019-01-31 00:18:38,610 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:38,876 : INFO : topic #45 (0.020): 0.022*\"black\" + 0.016*\"western\" + 0.015*\"colder\" + 0.013*\"record\" + 
0.011*\"blind\" + 0.010*\"light\" + 0.008*\"green\" + 0.007*\"illicit\" + 0.006*\"depress\" + 0.006*\"arm\"\n", + "2019-01-31 00:18:38,877 : INFO : topic #23 (0.020): 0.131*\"audit\" + 0.069*\"best\" + 0.034*\"jacksonvil\" + 0.029*\"japanes\" + 0.029*\"yawn\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.018*\"women\" + 0.015*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:18:38,878 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.018*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.013*\"margin\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"john\" + 0.011*\"daughter\" + 0.011*\"bone\"\n", + "2019-01-31 00:18:38,879 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.026*\"cortic\" + 0.021*\"start\" + 0.021*\"act\" + 0.019*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.009*\"justic\" + 0.009*\"unionist\"\n", + "2019-01-31 00:18:38,880 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.015*\"area\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"foam\" + 0.007*\"palmer\" + 0.007*\"vacant\"\n", + "2019-01-31 00:18:38,886 : INFO : topic diff=0.034481, rho=0.101015\n", + "2019-01-31 00:18:39,043 : INFO : PROGRESS: pass 0, at document #198000/4922894\n", + "2019-01-31 00:18:40,529 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:18:40,795 : INFO : topic #42 (0.020): 0.038*\"german\" + 0.024*\"germani\" + 0.013*\"vol\" + 0.012*\"israel\" + 0.012*\"berlin\" + 0.011*\"jewish\" + 0.010*\"der\" + 0.010*\"anglo\" + 0.009*\"greek\" + 0.008*\"austria\"\n", + "2019-01-31 00:18:40,796 : INFO : topic #44 (0.020): 0.035*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.016*\"champion\" + 0.015*\"tiepolo\" + 0.014*\"poet\" + 0.013*\"chamber\" + 0.013*\"martin\" + 0.012*\"taxpay\"\n", + "2019-01-31 00:18:40,798 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.026*\"spain\" + 
0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"josé\" + 0.010*\"lizard\"\n", + "2019-01-31 00:18:40,799 : INFO : topic #48 (0.020): 0.079*\"august\" + 0.076*\"march\" + 0.075*\"sens\" + 0.074*\"octob\" + 0.074*\"juli\" + 0.071*\"januari\" + 0.070*\"decatur\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.068*\"april\"\n", + "2019-01-31 00:18:40,800 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"crete\" + 0.022*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:18:40,806 : INFO : topic diff=0.034555, rho=0.100504\n", + "2019-01-31 00:18:43,616 : INFO : -11.562 per-word bound, 3023.6 perplexity estimate based on a held-out corpus of 2000 documents with 555661 words\n", + "2019-01-31 00:18:43,617 : INFO : PROGRESS: pass 0, at document #200000/4922894\n", + "2019-01-31 00:18:45,119 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:45,385 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"septemb\" + 0.020*\"epiru\" + 0.020*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:18:45,386 : INFO : topic #48 (0.020): 0.079*\"august\" + 0.076*\"sens\" + 0.075*\"octob\" + 0.075*\"march\" + 0.074*\"juli\" + 0.073*\"januari\" + 0.070*\"decatur\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.067*\"april\"\n", + "2019-01-31 00:18:45,388 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.022*\"adulthood\" + 0.016*\"hostil\" + 0.015*\"feel\" + 0.014*\"male\" + 0.013*\"genu\" + 0.012*\"live\" + 0.011*\"popolo\" + 0.010*\"yawn\"\n", + "2019-01-31 00:18:45,389 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.018*\"taxpay\" + 0.015*\"tornado\" + 0.013*\"candid\" + 0.012*\"find\" + 0.012*\"driver\" + 0.011*\"squatter\" + 
0.011*\"fool\" + 0.010*\"théori\" + 0.010*\"yawn\"\n", + "2019-01-31 00:18:45,390 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"arsen\" + 0.038*\"raid\" + 0.036*\"line\" + 0.030*\"museo\" + 0.020*\"pain\" + 0.020*\"traceabl\" + 0.019*\"word\" + 0.019*\"artist\" + 0.016*\"serv\"\n", + "2019-01-31 00:18:45,395 : INFO : topic diff=0.033841, rho=0.100000\n", + "2019-01-31 00:18:45,547 : INFO : PROGRESS: pass 0, at document #202000/4922894\n", + "2019-01-31 00:18:47,017 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:47,283 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.026*\"crete\" + 0.022*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:18:47,284 : INFO : topic #36 (0.020): 0.028*\"companhia\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.009*\"market\" + 0.009*\"network\" + 0.009*\"oper\" + 0.009*\"manag\" + 0.008*\"prognosi\" + 0.008*\"busi\" + 0.008*\"produc\"\n", + "2019-01-31 00:18:47,286 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.025*\"adulthood\" + 0.017*\"hostil\" + 0.016*\"feel\" + 0.013*\"male\" + 0.012*\"genu\" + 0.012*\"live\" + 0.011*\"popolo\" + 0.010*\"yawn\"\n", + "2019-01-31 00:18:47,287 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.029*\"collector\" + 0.019*\"institut\" + 0.018*\"schuster\" + 0.016*\"professor\" + 0.014*\"student\" + 0.013*\"requir\" + 0.012*\"american\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:18:47,288 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"litig\" + 0.005*\"blue\" + 0.004*\"bewild\" + 0.004*\"misconcept\" + 0.004*\"dai\" + 0.003*\"introductori\"\n", + "2019-01-31 00:18:47,294 : INFO : topic diff=0.032983, rho=0.099504\n", + "2019-01-31 00:18:47,450 : INFO : PROGRESS: pass 0, at document #204000/4922894\n", + "2019-01-31 00:18:48,967 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:49,233 : INFO : topic #49 (0.020): 0.038*\"india\" + 0.028*\"incumb\" + 0.014*\"televis\" + 0.012*\"pakistan\" + 0.010*\"islam\" + 0.009*\"start\" + 0.009*\"muskoge\" + 0.009*\"sri\" + 0.009*\"khalsa\" + 0.009*\"singh\"\n", + "2019-01-31 00:18:49,234 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.016*\"factor\" + 0.013*\"yawn\" + 0.013*\"margin\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"john\" + 0.011*\"life\" + 0.011*\"bone\"\n", + "2019-01-31 00:18:49,235 : INFO : topic #23 (0.020): 0.131*\"audit\" + 0.079*\"best\" + 0.035*\"jacksonvil\" + 0.029*\"yawn\" + 0.028*\"japanes\" + 0.020*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.014*\"intern\" + 0.013*\"categori\"\n", + "2019-01-31 00:18:49,237 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.026*\"factor\" + 0.025*\"adulthood\" + 0.017*\"hostil\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"genu\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.010*\"popolo\"\n", + "2019-01-31 00:18:49,238 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.032*\"publicis\" + 0.019*\"word\" + 0.014*\"new\" + 0.014*\"edit\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"presid\" + 0.010*\"author\"\n", + "2019-01-31 00:18:49,244 : INFO : topic diff=0.033727, rho=0.099015\n", + "2019-01-31 00:18:49,401 : INFO : PROGRESS: pass 0, at document #206000/4922894\n", + "2019-01-31 00:18:50,904 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:51,170 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.015*\"king\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"embassi\" + 0.007*\"till\"\n", + "2019-01-31 00:18:51,171 : INFO : topic #12 (0.020): 0.010*\"cytokin\" + 0.010*\"utopian\" + 0.009*\"number\" + 0.007*\"frontal\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 
0.006*\"exampl\" + 0.006*\"gener\"\n", + "2019-01-31 00:18:51,172 : INFO : topic #9 (0.020): 0.091*\"bone\" + 0.036*\"american\" + 0.027*\"valour\" + 0.018*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.015*\"dutch\" + 0.013*\"english\" + 0.012*\"simpler\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:18:51,173 : INFO : topic #48 (0.020): 0.079*\"octob\" + 0.079*\"august\" + 0.078*\"sens\" + 0.077*\"march\" + 0.075*\"januari\" + 0.074*\"juli\" + 0.074*\"notion\" + 0.072*\"decatur\" + 0.070*\"april\" + 0.068*\"judici\"\n", + "2019-01-31 00:18:51,175 : INFO : topic #44 (0.020): 0.036*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.016*\"champion\" + 0.015*\"poet\" + 0.014*\"tiepolo\" + 0.014*\"ret\" + 0.014*\"martin\" + 0.013*\"chamber\"\n", + "2019-01-31 00:18:51,180 : INFO : topic diff=0.029353, rho=0.098533\n", + "2019-01-31 00:18:51,339 : INFO : PROGRESS: pass 0, at document #208000/4922894\n", + "2019-01-31 00:18:52,840 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:53,106 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.025*\"spain\" + 0.020*\"del\" + 0.018*\"mexico\" + 0.015*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"josé\" + 0.010*\"lizard\"\n", + "2019-01-31 00:18:53,107 : INFO : topic #16 (0.020): 0.031*\"priest\" + 0.019*\"king\" + 0.018*\"duke\" + 0.017*\"quarterli\" + 0.015*\"grammat\" + 0.015*\"rotterdam\" + 0.014*\"maria\" + 0.013*\"portugues\" + 0.012*\"princ\" + 0.012*\"anima\"\n", + "2019-01-31 00:18:53,108 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.078*\"best\" + 0.035*\"jacksonvil\" + 0.029*\"yawn\" + 0.028*\"japanes\" + 0.021*\"noll\" + 0.021*\"festiv\" + 0.018*\"women\" + 0.014*\"prison\" + 0.014*\"intern\"\n", + "2019-01-31 00:18:53,109 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.006*\"gestur\" + 0.005*\"blue\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.004*\"introductori\" + 
0.003*\"misconcept\" + 0.003*\"dai\"\n", + "2019-01-31 00:18:53,110 : INFO : topic #4 (0.020): 0.025*\"enfranchis\" + 0.017*\"pour\" + 0.016*\"depress\" + 0.012*\"mode\" + 0.012*\"candid\" + 0.010*\"elabor\" + 0.010*\"veget\" + 0.009*\"produc\" + 0.008*\"encyclopedia\" + 0.008*\"mandir\"\n", + "2019-01-31 00:18:53,116 : INFO : topic diff=0.035179, rho=0.098058\n", + "2019-01-31 00:18:53,273 : INFO : PROGRESS: pass 0, at document #210000/4922894\n", + "2019-01-31 00:18:54,765 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:55,031 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"blue\" + 0.005*\"night\" + 0.005*\"litig\" + 0.004*\"bewild\" + 0.004*\"dai\" + 0.003*\"introductori\" + 0.003*\"misconcept\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:18:55,032 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.013*\"rival\" + 0.011*\"david\" + 0.011*\"georg\" + 0.010*\"slur\" + 0.009*\"rhyme\" + 0.008*\"mexican–american\" + 0.008*\"thirtieth\"\n", + "2019-01-31 00:18:55,033 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.024*\"aggress\" + 0.021*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"militari\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"airmen\" + 0.012*\"airbu\"\n", + "2019-01-31 00:18:55,034 : INFO : topic #49 (0.020): 0.039*\"india\" + 0.030*\"incumb\" + 0.015*\"televis\" + 0.012*\"pakistan\" + 0.010*\"islam\" + 0.009*\"khalsa\" + 0.009*\"start\" + 0.009*\"singh\" + 0.009*\"muskoge\" + 0.009*\"sri\"\n", + "2019-01-31 00:18:55,035 : INFO : topic #4 (0.020): 0.025*\"enfranchis\" + 0.018*\"pour\" + 0.016*\"depress\" + 0.012*\"candid\" + 0.012*\"mode\" + 0.011*\"elabor\" + 0.010*\"veget\" + 0.008*\"produc\" + 0.008*\"encyclopedia\" + 0.008*\"spectacl\"\n", + "2019-01-31 00:18:55,041 : INFO : topic diff=0.030341, rho=0.097590\n", + "2019-01-31 00:18:55,195 : INFO : PROGRESS: pass 0, at 
document #212000/4922894\n", + "2019-01-31 00:18:56,665 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:56,931 : INFO : topic #43 (0.020): 0.067*\"parti\" + 0.065*\"elect\" + 0.026*\"democrat\" + 0.025*\"voluntari\" + 0.022*\"member\" + 0.017*\"polici\" + 0.017*\"republ\" + 0.015*\"bypass\" + 0.014*\"report\" + 0.014*\"seaport\"\n", + "2019-01-31 00:18:56,932 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.028*\"cortic\" + 0.020*\"start\" + 0.019*\"act\" + 0.017*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.009*\"unionist\" + 0.008*\"justic\"\n", + "2019-01-31 00:18:56,933 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.015*\"king\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.008*\"empath\" + 0.008*\"embassi\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"till\"\n", + "2019-01-31 00:18:56,934 : INFO : topic #39 (0.020): 0.031*\"taxpay\" + 0.028*\"scientist\" + 0.025*\"canada\" + 0.023*\"clot\" + 0.021*\"canadian\" + 0.015*\"basketbal\" + 0.013*\"hoar\" + 0.012*\"confer\" + 0.011*\"yawn\" + 0.011*\"toronto\"\n", + "2019-01-31 00:18:56,935 : INFO : topic #32 (0.020): 0.063*\"district\" + 0.052*\"tortur\" + 0.049*\"vigour\" + 0.045*\"popolo\" + 0.029*\"regim\" + 0.028*\"multitud\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.021*\"prosper\" + 0.020*\"commun\"\n", + "2019-01-31 00:18:56,941 : INFO : topic diff=0.032093, rho=0.097129\n", + "2019-01-31 00:18:57,096 : INFO : PROGRESS: pass 0, at document #214000/4922894\n", + "2019-01-31 00:18:58,568 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:18:58,834 : INFO : topic #8 (0.020): 0.028*\"cortic\" + 0.028*\"law\" + 0.020*\"start\" + 0.018*\"act\" + 0.017*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"unionist\" + 0.009*\"legal\" + 0.008*\"justic\"\n", + "2019-01-31 00:18:58,835 : INFO : topic #43 (0.020): 0.067*\"parti\" + 0.066*\"elect\" + 0.026*\"voluntari\" + 
0.025*\"democrat\" + 0.022*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.014*\"report\"\n", + "2019-01-31 00:18:58,836 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.038*\"new\" + 0.024*\"palmer\" + 0.023*\"year\" + 0.016*\"strategist\" + 0.015*\"center\" + 0.012*\"open\" + 0.009*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:18:58,837 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.031*\"offic\" + 0.025*\"minist\" + 0.023*\"seri\" + 0.019*\"gener\" + 0.017*\"chickasaw\" + 0.016*\"serv\" + 0.016*\"member\" + 0.014*\"appeas\" + 0.013*\"secess\"\n", + "2019-01-31 00:18:58,838 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.015*\"king\" + 0.009*\"empath\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"embassi\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.008*\"kingdom\" + 0.007*\"armi\"\n", + "2019-01-31 00:18:58,844 : INFO : topic diff=0.027992, rho=0.096674\n", + "2019-01-31 00:18:59,000 : INFO : PROGRESS: pass 0, at document #216000/4922894\n", + "2019-01-31 00:19:00,502 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:00,767 : INFO : topic #4 (0.020): 0.026*\"enfranchis\" + 0.018*\"pour\" + 0.016*\"depress\" + 0.012*\"candid\" + 0.011*\"mode\" + 0.011*\"elabor\" + 0.009*\"veget\" + 0.009*\"encyclopedia\" + 0.009*\"spectacl\" + 0.008*\"produc\"\n", + "2019-01-31 00:19:00,769 : INFO : topic #35 (0.020): 0.046*\"russia\" + 0.031*\"sovereignti\" + 0.031*\"rural\" + 0.025*\"reprint\" + 0.021*\"personifi\" + 0.020*\"poison\" + 0.019*\"unfortun\" + 0.017*\"moscow\" + 0.015*\"shirin\" + 0.015*\"poland\"\n", + "2019-01-31 00:19:00,770 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.018*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.015*\"area\" + 0.009*\"land\" + 0.008*\"north\" + 0.007*\"firm\" + 0.007*\"foam\" + 0.007*\"vacant\"\n", + "2019-01-31 00:19:00,771 : INFO : topic #28 (0.020): 0.028*\"build\" + 0.024*\"hous\" + 0.017*\"rivièr\" + 
0.016*\"buford\" + 0.011*\"histor\" + 0.011*\"rosenwald\" + 0.011*\"constitut\" + 0.010*\"briarwood\" + 0.010*\"strategist\" + 0.009*\"lobe\"\n", + "2019-01-31 00:19:00,772 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.077*\"best\" + 0.041*\"jacksonvil\" + 0.028*\"yawn\" + 0.027*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.015*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:19:00,778 : INFO : topic diff=0.032962, rho=0.096225\n", + "2019-01-31 00:19:00,930 : INFO : PROGRESS: pass 0, at document #218000/4922894\n", + "2019-01-31 00:19:02,391 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:02,657 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.017*\"taxpay\" + 0.015*\"candid\" + 0.014*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.011*\"driver\" + 0.011*\"septemb\" + 0.010*\"théori\"\n", + "2019-01-31 00:19:02,659 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"compos\" + 0.018*\"damn\" + 0.018*\"physician\" + 0.018*\"wahl\" + 0.017*\"theater\" + 0.017*\"orchestr\" + 0.016*\"place\" + 0.014*\"olympo\"\n", + "2019-01-31 00:19:02,660 : INFO : topic #35 (0.020): 0.046*\"russia\" + 0.031*\"sovereignti\" + 0.030*\"rural\" + 0.025*\"reprint\" + 0.022*\"personifi\" + 0.019*\"poison\" + 0.019*\"unfortun\" + 0.018*\"moscow\" + 0.015*\"shirin\" + 0.014*\"poland\"\n", + "2019-01-31 00:19:02,662 : INFO : topic #46 (0.020): 0.023*\"wind\" + 0.019*\"sweden\" + 0.018*\"norwai\" + 0.015*\"damag\" + 0.014*\"swedish\" + 0.013*\"stop\" + 0.012*\"norwegian\" + 0.011*\"turkish\" + 0.011*\"turkei\" + 0.010*\"warren\"\n", + "2019-01-31 00:19:02,663 : INFO : topic #32 (0.020): 0.063*\"district\" + 0.052*\"vigour\" + 0.049*\"tortur\" + 0.044*\"popolo\" + 0.030*\"regim\" + 0.028*\"area\" + 0.028*\"multitud\" + 0.027*\"cotton\" + 0.021*\"prosper\" + 0.020*\"commun\"\n", + "2019-01-31 00:19:02,668 : INFO : topic diff=0.029279, rho=0.095783\n", + 
"2019-01-31 00:19:05,473 : INFO : -11.815 per-word bound, 3604.1 perplexity estimate based on a held-out corpus of 2000 documents with 557993 words\n", + "2019-01-31 00:19:05,473 : INFO : PROGRESS: pass 0, at document #220000/4922894\n", + "2019-01-31 00:19:06,970 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:07,235 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.044*\"arsen\" + 0.038*\"line\" + 0.032*\"raid\" + 0.031*\"museo\" + 0.020*\"word\" + 0.019*\"traceabl\" + 0.019*\"artist\" + 0.019*\"pain\" + 0.017*\"serv\"\n", + "2019-01-31 00:19:07,236 : INFO : topic #46 (0.020): 0.023*\"wind\" + 0.021*\"norwai\" + 0.019*\"sweden\" + 0.015*\"norwegian\" + 0.014*\"swedish\" + 0.014*\"damag\" + 0.013*\"stop\" + 0.011*\"utc\" + 0.011*\"turkei\" + 0.010*\"turkish\"\n", + "2019-01-31 00:19:07,237 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.016*\"taxpay\" + 0.015*\"tornado\" + 0.014*\"candid\" + 0.013*\"squatter\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"driver\" + 0.010*\"théori\" + 0.010*\"rick\"\n", + "2019-01-31 00:19:07,239 : INFO : topic #1 (0.020): 0.050*\"china\" + 0.049*\"chilton\" + 0.030*\"kong\" + 0.029*\"hong\" + 0.023*\"korea\" + 0.021*\"korean\" + 0.017*\"huei\" + 0.016*\"sourc\" + 0.014*\"min\" + 0.013*\"dynasti\"\n", + "2019-01-31 00:19:07,240 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.026*\"factor\" + 0.024*\"adulthood\" + 0.018*\"hostil\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"live\" + 0.011*\"genu\" + 0.010*\"popolo\" + 0.010*\"yawn\"\n", + "2019-01-31 00:19:07,246 : INFO : topic diff=0.027617, rho=0.095346\n", + "2019-01-31 00:19:07,405 : INFO : PROGRESS: pass 0, at document #222000/4922894\n", + "2019-01-31 00:19:08,916 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:09,181 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.018*\"armi\" + 0.017*\"com\" + 0.016*\"airmen\" + 
0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.011*\"airbu\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:19:09,182 : INFO : topic #32 (0.020): 0.063*\"district\" + 0.050*\"vigour\" + 0.049*\"tortur\" + 0.044*\"popolo\" + 0.029*\"regim\" + 0.029*\"area\" + 0.028*\"multitud\" + 0.026*\"cotton\" + 0.022*\"prosper\" + 0.020*\"commun\"\n", + "2019-01-31 00:19:09,183 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.048*\"franc\" + 0.029*\"pari\" + 0.026*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.011*\"piec\" + 0.010*\"loui\" + 0.010*\"wine\"\n", + "2019-01-31 00:19:09,184 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"compos\" + 0.019*\"damn\" + 0.017*\"physician\" + 0.017*\"theater\" + 0.016*\"place\" + 0.016*\"orchestr\" + 0.015*\"wahl\" + 0.014*\"olympo\"\n", + "2019-01-31 00:19:09,186 : INFO : topic #15 (0.020): 0.013*\"develop\" + 0.012*\"requir\" + 0.012*\"small\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.009*\"organ\" + 0.009*\"student\" + 0.008*\"commun\" + 0.008*\"socialist\" + 0.008*\"group\"\n", + "2019-01-31 00:19:09,191 : INFO : topic diff=0.031923, rho=0.094916\n", + "2019-01-31 00:19:09,406 : INFO : PROGRESS: pass 0, at document #224000/4922894\n", + "2019-01-31 00:19:10,896 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:11,161 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.017*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.009*\"slur\" + 0.009*\"rhyme\" + 0.009*\"mexican–american\" + 0.008*\"paul\"\n", + "2019-01-31 00:19:11,163 : INFO : topic #1 (0.020): 0.052*\"chilton\" + 0.051*\"china\" + 0.029*\"kong\" + 0.029*\"hong\" + 0.023*\"korea\" + 0.021*\"korean\" + 0.016*\"sourc\" + 0.015*\"huei\" + 0.013*\"leah\" + 0.012*\"min\"\n", + "2019-01-31 00:19:11,164 : INFO : topic #16 (0.020): 0.029*\"priest\" + 0.020*\"quarterli\" + 0.019*\"king\" + 0.018*\"duke\" 
+ 0.017*\"grammat\" + 0.016*\"rotterdam\" + 0.014*\"maria\" + 0.013*\"princ\" + 0.012*\"portugues\" + 0.011*\"klux\"\n", + "2019-01-31 00:19:11,165 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.081*\"march\" + 0.080*\"octob\" + 0.078*\"juli\" + 0.078*\"januari\" + 0.077*\"august\" + 0.075*\"judici\" + 0.075*\"april\" + 0.074*\"notion\" + 0.071*\"decatur\"\n", + "2019-01-31 00:19:11,167 : INFO : topic #39 (0.020): 0.030*\"taxpay\" + 0.028*\"scientist\" + 0.025*\"canada\" + 0.021*\"clot\" + 0.021*\"canadian\" + 0.015*\"basketbal\" + 0.013*\"hoar\" + 0.012*\"toronto\" + 0.012*\"confer\" + 0.011*\"yawn\"\n", + "2019-01-31 00:19:11,173 : INFO : topic diff=0.028385, rho=0.094491\n", + "2019-01-31 00:19:11,326 : INFO : PROGRESS: pass 0, at document #226000/4922894\n", + "2019-01-31 00:19:12,800 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:13,065 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.038*\"new\" + 0.024*\"palmer\" + 0.023*\"year\" + 0.017*\"center\" + 0.016*\"strategist\" + 0.011*\"open\" + 0.009*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:19:13,066 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.031*\"offic\" + 0.025*\"minist\" + 0.022*\"seri\" + 0.019*\"gener\" + 0.018*\"serv\" + 0.017*\"chickasaw\" + 0.016*\"member\" + 0.014*\"appeas\" + 0.013*\"secess\"\n", + "2019-01-31 00:19:13,067 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.046*\"franc\" + 0.028*\"pari\" + 0.026*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.011*\"wine\" + 0.010*\"focal\"\n", + "2019-01-31 00:19:13,068 : INFO : topic #19 (0.020): 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"woodcut\" + 0.008*\"god\" + 0.008*\"like\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.006*\"differ\" + 0.006*\"call\"\n", + "2019-01-31 00:19:13,069 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"blue\" + 0.004*\"bewild\" + 
0.004*\"litig\" + 0.004*\"christma\" + 0.004*\"dai\" + 0.004*\"toll\"\n", + "2019-01-31 00:19:13,075 : INFO : topic diff=0.026800, rho=0.094072\n", + "2019-01-31 00:19:13,228 : INFO : PROGRESS: pass 0, at document #228000/4922894\n", + "2019-01-31 00:19:14,695 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:14,961 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.032*\"leagu\" + 0.030*\"place\" + 0.025*\"taxpay\" + 0.024*\"crete\" + 0.023*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:19:14,962 : INFO : topic #41 (0.020): 0.048*\"citi\" + 0.038*\"new\" + 0.024*\"palmer\" + 0.023*\"year\" + 0.017*\"center\" + 0.016*\"strategist\" + 0.012*\"open\" + 0.009*\"includ\" + 0.009*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 00:19:14,963 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"compos\" + 0.019*\"physician\" + 0.017*\"damn\" + 0.017*\"place\" + 0.015*\"theater\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"wahl\"\n", + "2019-01-31 00:19:14,964 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.046*\"franc\" + 0.028*\"pari\" + 0.027*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"loui\" + 0.010*\"wine\"\n", + "2019-01-31 00:19:14,965 : INFO : topic #32 (0.020): 0.062*\"district\" + 0.050*\"vigour\" + 0.048*\"tortur\" + 0.043*\"popolo\" + 0.029*\"regim\" + 0.029*\"area\" + 0.028*\"multitud\" + 0.026*\"cotton\" + 0.021*\"prosper\" + 0.020*\"commun\"\n", + "2019-01-31 00:19:14,971 : INFO : topic diff=0.026556, rho=0.093659\n", + "2019-01-31 00:19:15,126 : INFO : PROGRESS: pass 0, at document #230000/4922894\n", + "2019-01-31 00:19:16,589 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:16,855 : INFO : topic #41 (0.020): 0.048*\"citi\" + 0.038*\"new\" + 0.024*\"palmer\" + 0.023*\"year\" + 0.016*\"center\" + 0.016*\"strategist\" + 
0.012*\"open\" + 0.009*\"includ\" + 0.009*\"hot\" + 0.009*\"lobe\"\n", + "2019-01-31 00:19:16,856 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.027*\"sail\" + 0.027*\"pari\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"wreath\" + 0.011*\"piec\" + 0.010*\"loui\"\n", + "2019-01-31 00:19:16,857 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"compos\" + 0.019*\"physician\" + 0.018*\"damn\" + 0.017*\"place\" + 0.015*\"theater\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:19:16,858 : INFO : topic #16 (0.020): 0.029*\"priest\" + 0.021*\"duke\" + 0.019*\"king\" + 0.018*\"quarterli\" + 0.016*\"grammat\" + 0.014*\"rotterdam\" + 0.013*\"maria\" + 0.013*\"princ\" + 0.011*\"portugues\" + 0.011*\"count\"\n", + "2019-01-31 00:19:16,859 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.011*\"georg\" + 0.010*\"slur\" + 0.009*\"rhyme\" + 0.008*\"mexican–american\" + 0.007*\"thirtieth\"\n", + "2019-01-31 00:19:16,865 : INFO : topic diff=0.026651, rho=0.093250\n", + "2019-01-31 00:19:17,018 : INFO : PROGRESS: pass 0, at document #232000/4922894\n", + "2019-01-31 00:19:18,480 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:18,746 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.033*\"leagu\" + 0.030*\"place\" + 0.025*\"taxpay\" + 0.024*\"crete\" + 0.022*\"scientist\" + 0.022*\"folei\" + 0.017*\"martin\" + 0.016*\"goal\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:19:18,747 : INFO : topic #17 (0.020): 0.058*\"church\" + 0.019*\"fifteenth\" + 0.018*\"jpg\" + 0.017*\"cathol\" + 0.017*\"retroflex\" + 0.016*\"bishop\" + 0.016*\"centuri\" + 0.015*\"christian\" + 0.013*\"sail\" + 0.012*\"italian\"\n", + "2019-01-31 00:19:18,749 : INFO : topic #1 (0.020): 0.053*\"chilton\" + 0.051*\"china\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.022*\"korea\" + 0.020*\"korean\" + 
0.017*\"sourc\" + 0.013*\"leah\" + 0.012*\"taiwan\" + 0.011*\"min\"\n", + "2019-01-31 00:19:18,750 : INFO : topic #36 (0.020): 0.028*\"companhia\" + 0.010*\"market\" + 0.009*\"serv\" + 0.009*\"manag\" + 0.009*\"develop\" + 0.009*\"busi\" + 0.009*\"oper\" + 0.008*\"produc\" + 0.008*\"prognosi\" + 0.008*\"includ\"\n", + "2019-01-31 00:19:18,751 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"blue\" + 0.004*\"bewild\" + 0.004*\"litig\" + 0.004*\"introductori\" + 0.004*\"christma\" + 0.004*\"dai\"\n", + "2019-01-31 00:19:18,757 : INFO : topic diff=0.025051, rho=0.092848\n", + "2019-01-31 00:19:18,911 : INFO : PROGRESS: pass 0, at document #234000/4922894\n", + "2019-01-31 00:19:20,383 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:20,648 : INFO : topic #28 (0.020): 0.027*\"build\" + 0.024*\"hous\" + 0.020*\"rivièr\" + 0.016*\"buford\" + 0.012*\"histor\" + 0.011*\"constitut\" + 0.011*\"rosenwald\" + 0.010*\"briarwood\" + 0.009*\"strategist\" + 0.009*\"lobe\"\n", + "2019-01-31 00:19:20,649 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"cytokin\" + 0.007*\"frontal\" + 0.007*\"measur\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"servitud\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:19:20,651 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.027*\"factor\" + 0.022*\"adulthood\" + 0.017*\"hostil\" + 0.015*\"feel\" + 0.013*\"male\" + 0.012*\"live\" + 0.011*\"genu\" + 0.010*\"plaisir\" + 0.010*\"popolo\"\n", + "2019-01-31 00:19:20,652 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"blue\" + 0.004*\"bewild\" + 0.004*\"litig\" + 0.004*\"todd\" + 0.004*\"introductori\" + 0.004*\"christma\"\n", + "2019-01-31 00:19:20,654 : INFO : topic #39 (0.020): 0.033*\"taxpay\" + 0.028*\"scientist\" + 
0.026*\"canada\" + 0.023*\"clot\" + 0.022*\"canadian\" + 0.017*\"basketbal\" + 0.014*\"hoar\" + 0.012*\"confer\" + 0.011*\"toronto\" + 0.011*\"yawn\"\n", + "2019-01-31 00:19:20,659 : INFO : topic diff=0.026623, rho=0.092450\n", + "2019-01-31 00:19:20,814 : INFO : PROGRESS: pass 0, at document #236000/4922894\n", + "2019-01-31 00:19:22,300 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:22,566 : INFO : topic #35 (0.020): 0.045*\"russia\" + 0.035*\"sovereignti\" + 0.028*\"rural\" + 0.023*\"personifi\" + 0.022*\"reprint\" + 0.022*\"poison\" + 0.018*\"moscow\" + 0.018*\"unfortun\" + 0.014*\"shirin\" + 0.013*\"intern\"\n", + "2019-01-31 00:19:22,567 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"blue\" + 0.005*\"night\" + 0.004*\"bewild\" + 0.004*\"litig\" + 0.004*\"todd\" + 0.004*\"christma\" + 0.004*\"dai\"\n", + "2019-01-31 00:19:22,568 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.044*\"arsen\" + 0.038*\"line\" + 0.032*\"raid\" + 0.031*\"museo\" + 0.020*\"pain\" + 0.019*\"word\" + 0.019*\"traceabl\" + 0.017*\"artist\" + 0.017*\"serv\"\n", + "2019-01-31 00:19:22,569 : INFO : topic #15 (0.020): 0.014*\"develop\" + 0.012*\"requir\" + 0.012*\"small\" + 0.010*\"cultur\" + 0.010*\"word\" + 0.009*\"organ\" + 0.009*\"student\" + 0.008*\"socialist\" + 0.008*\"commun\" + 0.008*\"human\"\n", + "2019-01-31 00:19:22,571 : INFO : topic #48 (0.020): 0.083*\"octob\" + 0.083*\"march\" + 0.081*\"sens\" + 0.078*\"juli\" + 0.077*\"januari\" + 0.076*\"august\" + 0.076*\"april\" + 0.076*\"notion\" + 0.075*\"judici\" + 0.072*\"decatur\"\n", + "2019-01-31 00:19:22,577 : INFO : topic diff=0.027172, rho=0.092057\n", + "2019-01-31 00:19:22,732 : INFO : PROGRESS: pass 0, at document #238000/4922894\n", + "2019-01-31 00:19:24,220 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:24,486 : INFO : topic #20 (0.020): 0.125*\"scholar\" + 
0.035*\"struggl\" + 0.029*\"high\" + 0.028*\"educ\" + 0.018*\"yawn\" + 0.016*\"collector\" + 0.014*\"prognosi\" + 0.008*\"task\" + 0.008*\"class\" + 0.008*\"gothic\"\n", + "2019-01-31 00:19:24,487 : INFO : topic #33 (0.020): 0.057*\"french\" + 0.045*\"franc\" + 0.028*\"pari\" + 0.026*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.011*\"wreath\" + 0.010*\"loui\"\n", + "2019-01-31 00:19:24,488 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.006*\"kill\" + 0.006*\"man\" + 0.006*\"sack\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.004*\"fraud\" + 0.004*\"help\"\n", + "2019-01-31 00:19:24,490 : INFO : topic #9 (0.020): 0.080*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.018*\"player\" + 0.018*\"polit\" + 0.016*\"folei\" + 0.016*\"english\" + 0.015*\"dutch\" + 0.012*\"simpler\" + 0.012*\"wedg\"\n", + "2019-01-31 00:19:24,491 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.014*\"king\" + 0.011*\"battalion\" + 0.009*\"aza\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.008*\"embassi\" + 0.007*\"centuri\" + 0.007*\"armi\" + 0.007*\"teufel\"\n", + "2019-01-31 00:19:24,497 : INFO : topic diff=0.027511, rho=0.091670\n", + "2019-01-31 00:19:27,254 : INFO : -11.718 per-word bound, 3369.6 perplexity estimate based on a held-out corpus of 2000 documents with 540188 words\n", + "2019-01-31 00:19:27,254 : INFO : PROGRESS: pass 0, at document #240000/4922894\n", + "2019-01-31 00:19:28,723 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:28,988 : INFO : topic #28 (0.020): 0.028*\"build\" + 0.023*\"hous\" + 0.019*\"rivièr\" + 0.016*\"buford\" + 0.012*\"histor\" + 0.011*\"constitut\" + 0.010*\"rosenwald\" + 0.009*\"briarwood\" + 0.009*\"lobe\" + 0.009*\"silicon\"\n", + "2019-01-31 00:19:28,990 : INFO : topic #26 (0.020): 0.033*\"woman\" + 0.031*\"workplac\" + 0.031*\"champion\" + 0.026*\"medal\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.020*\"event\" + 0.019*\"alic\" 
+ 0.019*\"atheist\" + 0.018*\"gold\"\n", + "2019-01-31 00:19:28,991 : INFO : topic #46 (0.020): 0.023*\"wind\" + 0.020*\"damag\" + 0.019*\"sweden\" + 0.019*\"norwai\" + 0.017*\"norwegian\" + 0.015*\"swedish\" + 0.014*\"stop\" + 0.010*\"turkei\" + 0.010*\"farid\" + 0.009*\"caus\"\n", + "2019-01-31 00:19:28,992 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"deal\" + 0.013*\"faster\" + 0.012*\"life\" + 0.012*\"bone\" + 0.011*\"john\"\n", + "2019-01-31 00:19:28,993 : INFO : topic #9 (0.020): 0.078*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.019*\"polit\" + 0.018*\"player\" + 0.017*\"folei\" + 0.015*\"english\" + 0.015*\"dutch\" + 0.012*\"wedg\" + 0.012*\"simpler\"\n", + "2019-01-31 00:19:28,999 : INFO : topic diff=0.024902, rho=0.091287\n", + "2019-01-31 00:19:29,152 : INFO : PROGRESS: pass 0, at document #242000/4922894\n", + "2019-01-31 00:19:30,604 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:30,871 : INFO : topic #15 (0.020): 0.014*\"develop\" + 0.012*\"requir\" + 0.012*\"small\" + 0.010*\"cultur\" + 0.010*\"word\" + 0.009*\"organ\" + 0.009*\"student\" + 0.009*\"commun\" + 0.008*\"human\" + 0.008*\"socialist\"\n", + "2019-01-31 00:19:30,872 : INFO : topic #35 (0.020): 0.045*\"russia\" + 0.035*\"sovereignti\" + 0.027*\"rural\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.017*\"moscow\" + 0.017*\"unfortun\" + 0.015*\"shirin\" + 0.013*\"intern\"\n", + "2019-01-31 00:19:30,873 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.025*\"final\" + 0.024*\"wife\" + 0.017*\"champion\" + 0.017*\"tourist\" + 0.017*\"martin\" + 0.015*\"chamber\" + 0.014*\"poet\" + 0.014*\"open\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:19:30,875 : INFO : topic #1 (0.020): 0.055*\"chilton\" + 0.050*\"china\" + 0.027*\"hong\" + 0.027*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"leah\" + 
0.012*\"levinson\"\n", + "2019-01-31 00:19:30,876 : INFO : topic #17 (0.020): 0.056*\"church\" + 0.021*\"jpg\" + 0.020*\"fifteenth\" + 0.017*\"christian\" + 0.017*\"cathol\" + 0.016*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"centuri\" + 0.014*\"italian\" + 0.013*\"sail\"\n", + "2019-01-31 00:19:30,882 : INFO : topic diff=0.025514, rho=0.090909\n", + "2019-01-31 00:19:31,030 : INFO : PROGRESS: pass 0, at document #244000/4922894\n", + "2019-01-31 00:19:32,472 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:32,738 : INFO : topic #42 (0.020): 0.042*\"german\" + 0.025*\"germani\" + 0.014*\"israel\" + 0.013*\"vol\" + 0.012*\"berlin\" + 0.012*\"der\" + 0.010*\"jewish\" + 0.009*\"isra\" + 0.008*\"greek\" + 0.008*\"austria\"\n", + "2019-01-31 00:19:32,739 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.012*\"rival\" + 0.011*\"david\" + 0.011*\"georg\" + 0.010*\"slur\" + 0.009*\"mexican–american\" + 0.009*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:19:32,740 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.027*\"cortic\" + 0.020*\"start\" + 0.018*\"ricardo\" + 0.016*\"act\" + 0.014*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"unionist\"\n", + "2019-01-31 00:19:32,741 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.006*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"blue\" + 0.004*\"litig\" + 0.004*\"bewild\" + 0.004*\"todd\" + 0.003*\"introductori\" + 0.003*\"dai\"\n", + "2019-01-31 00:19:32,742 : INFO : topic #36 (0.020): 0.028*\"companhia\" + 0.010*\"develop\" + 0.010*\"serv\" + 0.009*\"manag\" + 0.009*\"market\" + 0.008*\"oper\" + 0.008*\"includ\" + 0.008*\"produc\" + 0.008*\"busi\" + 0.008*\"prognosi\"\n", + "2019-01-31 00:19:32,748 : INFO : topic diff=0.027092, rho=0.090536\n", + "2019-01-31 00:19:32,902 : INFO : PROGRESS: pass 0, at document #246000/4922894\n", + "2019-01-31 00:19:34,363 : INFO : merging changes from 2000 documents into a model 
of 4922894 documents\n", + "2019-01-31 00:19:34,630 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.024*\"player\" + 0.018*\"place\" + 0.018*\"scientist\" + 0.016*\"taxpay\" + 0.011*\"leagu\" + 0.011*\"yard\" + 0.010*\"folei\" + 0.010*\"ruler\" + 0.009*\"barber\"\n", + "2019-01-31 00:19:34,631 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.021*\"adulthood\" + 0.016*\"hostil\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.010*\"popolo\" + 0.009*\"genu\"\n", + "2019-01-31 00:19:34,632 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.030*\"collector\" + 0.019*\"institut\" + 0.018*\"schuster\" + 0.015*\"student\" + 0.014*\"professor\" + 0.014*\"requir\" + 0.012*\"governor\" + 0.012*\"http\" + 0.011*\"word\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:19:34,633 : INFO : topic #16 (0.020): 0.029*\"priest\" + 0.021*\"duke\" + 0.019*\"king\" + 0.019*\"quarterli\" + 0.017*\"maria\" + 0.016*\"grammat\" + 0.014*\"rotterdam\" + 0.013*\"princ\" + 0.013*\"portrait\" + 0.013*\"portugues\"\n", + "2019-01-31 00:19:34,635 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.034*\"leagu\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:19:34,641 : INFO : topic diff=0.026266, rho=0.090167\n", + "2019-01-31 00:19:34,790 : INFO : PROGRESS: pass 0, at document #248000/4922894\n", + "2019-01-31 00:19:36,215 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:36,481 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:19:36,482 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.044*\"cotton\" + 0.029*\"unionist\" + 0.022*\"american\" + 0.017*\"toni\" + 
0.015*\"new\" + 0.014*\"terri\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.011*\"north\"\n", + "2019-01-31 00:19:36,483 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.034*\"leagu\" + 0.028*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:19:36,484 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.026*\"cortic\" + 0.020*\"start\" + 0.017*\"ricardo\" + 0.016*\"act\" + 0.015*\"case\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.008*\"judaism\" + 0.008*\"unionist\"\n", + "2019-01-31 00:19:36,485 : INFO : topic #17 (0.020): 0.058*\"church\" + 0.020*\"jpg\" + 0.019*\"fifteenth\" + 0.018*\"cathol\" + 0.018*\"bishop\" + 0.017*\"christian\" + 0.015*\"retroflex\" + 0.015*\"centuri\" + 0.014*\"italian\" + 0.014*\"sail\"\n", + "2019-01-31 00:19:36,491 : INFO : topic diff=0.026258, rho=0.089803\n", + "2019-01-31 00:19:36,649 : INFO : PROGRESS: pass 0, at document #250000/4922894\n", + "2019-01-31 00:19:38,146 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:38,412 : INFO : topic #1 (0.020): 0.054*\"chilton\" + 0.051*\"china\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.022*\"korean\" + 0.022*\"korea\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.013*\"leah\" + 0.012*\"taiwan\"\n", + "2019-01-31 00:19:38,413 : INFO : topic #28 (0.020): 0.028*\"build\" + 0.023*\"rivièr\" + 0.023*\"hous\" + 0.016*\"buford\" + 0.011*\"histor\" + 0.011*\"constitut\" + 0.011*\"rosenwald\" + 0.010*\"briarwood\" + 0.009*\"strategist\" + 0.009*\"lobe\"\n", + "2019-01-31 00:19:38,414 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.041*\"arsen\" + 0.038*\"line\" + 0.033*\"raid\" + 0.031*\"museo\" + 0.020*\"pain\" + 0.019*\"traceabl\" + 0.018*\"word\" + 0.017*\"serv\" + 0.016*\"artist\"\n", + "2019-01-31 00:19:38,416 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.036*\"shield\" + 0.018*\"narrat\" + 0.016*\"blur\" + 0.014*\"scot\" + 0.012*\"pope\" + 
0.011*\"nativist\" + 0.010*\"sai\" + 0.010*\"fleet\" + 0.009*\"coalit\"\n", + "2019-01-31 00:19:38,417 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.017*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.013*\"lizard\" + 0.012*\"juan\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"josé\"\n", + "2019-01-31 00:19:38,423 : INFO : topic diff=0.026226, rho=0.089443\n", + "2019-01-31 00:19:38,578 : INFO : PROGRESS: pass 0, at document #252000/4922894\n", + "2019-01-31 00:19:40,049 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:40,315 : INFO : topic #48 (0.020): 0.076*\"march\" + 0.075*\"sens\" + 0.075*\"octob\" + 0.071*\"januari\" + 0.071*\"juli\" + 0.070*\"august\" + 0.070*\"notion\" + 0.069*\"decatur\" + 0.067*\"judici\" + 0.066*\"april\"\n", + "2019-01-31 00:19:40,316 : INFO : topic #19 (0.020): 0.009*\"origin\" + 0.009*\"charact\" + 0.009*\"form\" + 0.008*\"woodcut\" + 0.008*\"like\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"god\" + 0.007*\"languag\" + 0.006*\"dynam\"\n", + "2019-01-31 00:19:40,318 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.015*\"hostil\" + 0.015*\"feel\" + 0.013*\"male\" + 0.012*\"genu\" + 0.011*\"plaisir\" + 0.010*\"live\" + 0.010*\"popolo\"\n", + "2019-01-31 00:19:40,319 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.019*\"warmth\" + 0.015*\"mount\" + 0.015*\"lagrang\" + 0.014*\"area\" + 0.008*\"land\" + 0.008*\"firm\" + 0.008*\"north\" + 0.007*\"vacant\" + 0.007*\"foam\"\n", + "2019-01-31 00:19:40,320 : INFO : topic #13 (0.020): 0.029*\"australia\" + 0.028*\"sourc\" + 0.024*\"new\" + 0.024*\"australian\" + 0.022*\"england\" + 0.021*\"london\" + 0.017*\"youth\" + 0.016*\"ireland\" + 0.016*\"british\" + 0.015*\"wale\"\n", + "2019-01-31 00:19:40,326 : INFO : topic diff=0.024678, rho=0.089087\n", + "2019-01-31 00:19:40,540 : INFO : PROGRESS: pass 0, at document #254000/4922894\n", + "2019-01-31 00:19:42,027 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:42,293 : INFO : topic #28 (0.020): 0.028*\"build\" + 0.023*\"rivièr\" + 0.023*\"hous\" + 0.016*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"rosenwald\" + 0.009*\"strategist\" + 0.009*\"lobe\"\n", + "2019-01-31 00:19:42,294 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.041*\"cotton\" + 0.029*\"unionist\" + 0.022*\"american\" + 0.015*\"new\" + 0.015*\"california\" + 0.014*\"terri\" + 0.014*\"toni\" + 0.012*\"warrior\" + 0.011*\"north\"\n", + "2019-01-31 00:19:42,295 : INFO : topic #6 (0.020): 0.067*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:19:42,296 : INFO : topic #19 (0.020): 0.009*\"origin\" + 0.009*\"charact\" + 0.009*\"form\" + 0.009*\"woodcut\" + 0.008*\"like\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"god\" + 0.007*\"dynam\" + 0.007*\"languag\"\n", + "2019-01-31 00:19:42,298 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.006*\"sack\" + 0.006*\"man\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.004*\"deal\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:19:42,304 : INFO : topic diff=0.023731, rho=0.088736\n", + "2019-01-31 00:19:42,463 : INFO : PROGRESS: pass 0, at document #256000/4922894\n", + "2019-01-31 00:19:43,952 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:44,218 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"genu\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.010*\"popolo\"\n", + "2019-01-31 00:19:44,219 : INFO : topic #42 (0.020): 0.040*\"german\" + 0.026*\"germani\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.012*\"berlin\" + 0.011*\"vol\" + 0.011*\"der\" + 
0.008*\"isra\" + 0.008*\"anglo\" + 0.008*\"jeremiah\"\n", + "2019-01-31 00:19:44,221 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.019*\"western\" + 0.015*\"colder\" + 0.013*\"record\" + 0.011*\"blind\" + 0.009*\"light\" + 0.009*\"green\" + 0.007*\"arm\" + 0.006*\"illicit\" + 0.006*\"hand\"\n", + "2019-01-31 00:19:44,222 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.015*\"area\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"firm\" + 0.007*\"vacant\"\n", + "2019-01-31 00:19:44,223 : INFO : topic #8 (0.020): 0.030*\"law\" + 0.026*\"cortic\" + 0.020*\"start\" + 0.017*\"act\" + 0.016*\"ricardo\" + 0.014*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"judaism\" + 0.008*\"justic\"\n", + "2019-01-31 00:19:44,229 : INFO : topic diff=0.026460, rho=0.088388\n", + "2019-01-31 00:19:44,385 : INFO : PROGRESS: pass 0, at document #258000/4922894\n", + "2019-01-31 00:19:45,867 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:46,133 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"area\" + 0.015*\"mount\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"firm\" + 0.007*\"vacant\"\n", + "2019-01-31 00:19:46,134 : INFO : topic #47 (0.020): 0.068*\"muscl\" + 0.036*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.018*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:19:46,136 : INFO : topic #46 (0.020): 0.018*\"wind\" + 0.018*\"norwai\" + 0.016*\"stop\" + 0.016*\"sweden\" + 0.015*\"norwegian\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.011*\"turkish\" + 0.011*\"turkei\" + 0.010*\"financ\"\n", + "2019-01-31 00:19:46,137 : INFO : topic #41 (0.020): 0.050*\"citi\" + 0.036*\"new\" + 0.028*\"palmer\" + 0.021*\"year\" + 0.017*\"center\" + 0.015*\"strategist\" + 0.011*\"open\" + 0.010*\"hot\" + 0.009*\"includ\" + 
0.009*\"lobe\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:19:46,137 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.042*\"arsen\" + 0.037*\"line\" + 0.033*\"raid\" + 0.031*\"museo\" + 0.021*\"pain\" + 0.019*\"traceabl\" + 0.019*\"word\" + 0.016*\"serv\" + 0.016*\"artist\"\n", + "2019-01-31 00:19:46,143 : INFO : topic diff=0.026356, rho=0.088045\n", + "2019-01-31 00:19:48,892 : INFO : -11.654 per-word bound, 3222.2 perplexity estimate based on a held-out corpus of 2000 documents with 531693 words\n", + "2019-01-31 00:19:48,892 : INFO : PROGRESS: pass 0, at document #260000/4922894\n", + "2019-01-31 00:19:50,365 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:50,631 : INFO : topic #31 (0.020): 0.066*\"fusiform\" + 0.025*\"player\" + 0.020*\"place\" + 0.019*\"scientist\" + 0.016*\"taxpay\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"ruler\" + 0.010*\"yard\" + 0.008*\"barber\"\n", + "2019-01-31 00:19:50,633 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.024*\"spain\" + 0.018*\"mexico\" + 0.017*\"del\" + 0.015*\"soviet\" + 0.012*\"lizard\" + 0.012*\"santa\" + 0.011*\"josé\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 00:19:50,634 : INFO : topic #17 (0.020): 0.058*\"church\" + 0.019*\"jpg\" + 0.019*\"fifteenth\" + 0.018*\"christian\" + 0.017*\"bishop\" + 0.017*\"cathol\" + 0.016*\"centuri\" + 0.014*\"retroflex\" + 0.013*\"sail\" + 0.013*\"italian\"\n", + "2019-01-31 00:19:50,635 : INFO : topic #7 (0.020): 0.019*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.012*\"deal\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"bone\" + 0.011*\"john\"\n", + "2019-01-31 00:19:50,636 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.058*\"parti\" + 0.031*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.018*\"polici\" + 0.016*\"liber\" + 0.016*\"bypass\" + 0.014*\"republ\" + 0.013*\"selma\"\n", + "2019-01-31 00:19:50,642 : 
INFO : topic diff=0.023684, rho=0.087706\n", + "2019-01-31 00:19:50,796 : INFO : PROGRESS: pass 0, at document #262000/4922894\n", + "2019-01-31 00:19:52,252 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:52,518 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.029*\"incumb\" + 0.013*\"televis\" + 0.012*\"pakistan\" + 0.011*\"islam\" + 0.011*\"khalsa\" + 0.010*\"sri\" + 0.009*\"start\" + 0.009*\"alam\" + 0.009*\"muskoge\"\n", + "2019-01-31 00:19:52,520 : INFO : topic #6 (0.020): 0.066*\"fewer\" + 0.024*\"septemb\" + 0.021*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:19:52,522 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.014*\"area\" + 0.014*\"mount\" + 0.008*\"north\" + 0.008*\"land\" + 0.007*\"firm\" + 0.007*\"foam\" + 0.007*\"vacant\"\n", + "2019-01-31 00:19:52,522 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.023*\"seri\" + 0.018*\"gener\" + 0.018*\"member\" + 0.016*\"chickasaw\" + 0.016*\"serv\" + 0.015*\"appeas\" + 0.012*\"secess\"\n", + "2019-01-31 00:19:52,523 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.011*\"start\" + 0.009*\"replac\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"new\" + 0.006*\"placement\" + 0.006*\"summerhil\"\n", + "2019-01-31 00:19:52,529 : INFO : topic diff=0.022696, rho=0.087370\n", + "2019-01-31 00:19:52,683 : INFO : PROGRESS: pass 0, at document #264000/4922894\n", + "2019-01-31 00:19:54,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:54,410 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.012*\"candid\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.007*\"mandir\" + 0.007*\"uruguayan\"\n", + "2019-01-31 
00:19:54,411 : INFO : topic #32 (0.020): 0.064*\"district\" + 0.051*\"vigour\" + 0.046*\"tortur\" + 0.042*\"popolo\" + 0.029*\"regim\" + 0.027*\"area\" + 0.025*\"multitud\" + 0.023*\"cotton\" + 0.020*\"commun\" + 0.019*\"prosper\"\n", + "2019-01-31 00:19:54,411 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"arsen\" + 0.039*\"line\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.019*\"pain\" + 0.019*\"word\" + 0.018*\"traceabl\" + 0.017*\"serv\" + 0.016*\"artist\"\n", + "2019-01-31 00:19:54,413 : INFO : topic #39 (0.020): 0.032*\"taxpay\" + 0.028*\"canada\" + 0.027*\"scientist\" + 0.023*\"canadian\" + 0.021*\"clot\" + 0.016*\"basketbal\" + 0.015*\"hoar\" + 0.013*\"toronto\" + 0.013*\"confer\" + 0.011*\"ontario\"\n", + "2019-01-31 00:19:54,414 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.034*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.016*\"martin\" + 0.016*\"goal\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:19:54,420 : INFO : topic diff=0.022069, rho=0.087039\n", + "2019-01-31 00:19:54,575 : INFO : PROGRESS: pass 0, at document #266000/4922894\n", + "2019-01-31 00:19:56,039 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:56,304 : INFO : topic #16 (0.020): 0.031*\"priest\" + 0.022*\"king\" + 0.022*\"duke\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"maria\" + 0.015*\"rotterdam\" + 0.014*\"princ\" + 0.012*\"idiosyncrat\" + 0.012*\"order\"\n", + "2019-01-31 00:19:56,305 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.020*\"word\" + 0.016*\"new\" + 0.014*\"storag\" + 0.014*\"edit\" + 0.012*\"presid\" + 0.012*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:19:56,307 : INFO : topic #31 (0.020): 0.069*\"fusiform\" + 0.027*\"player\" + 0.021*\"place\" + 0.018*\"scientist\" + 0.016*\"taxpay\" + 0.011*\"leagu\" + 0.011*\"folei\" + 0.010*\"ruler\" + 0.009*\"yard\" + 0.009*\"barber\"\n", + "2019-01-31 
00:19:56,308 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"airmen\"\n", + "2019-01-31 00:19:56,309 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.042*\"arsen\" + 0.039*\"line\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.019*\"pain\" + 0.018*\"word\" + 0.018*\"traceabl\" + 0.017*\"serv\" + 0.017*\"artist\"\n", + "2019-01-31 00:19:56,315 : INFO : topic diff=0.021942, rho=0.086711\n", + "2019-01-31 00:19:56,469 : INFO : PROGRESS: pass 0, at document #268000/4922894\n", + "2019-01-31 00:19:57,926 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:19:58,192 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.017*\"wind\" + 0.017*\"norwai\" + 0.016*\"sweden\" + 0.014*\"damag\" + 0.014*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"turkish\" + 0.012*\"turkei\" + 0.010*\"wavi\"\n", + "2019-01-31 00:19:58,193 : INFO : topic #32 (0.020): 0.063*\"district\" + 0.049*\"vigour\" + 0.046*\"tortur\" + 0.043*\"popolo\" + 0.028*\"regim\" + 0.027*\"area\" + 0.025*\"multitud\" + 0.023*\"cotton\" + 0.020*\"commun\" + 0.019*\"citi\"\n", + "2019-01-31 00:19:58,195 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.011*\"start\" + 0.008*\"replac\" + 0.007*\"countri\" + 0.007*\"yawn\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"summerhil\" + 0.006*\"new\" + 0.006*\"théori\"\n", + "2019-01-31 00:19:58,196 : INFO : topic #6 (0.020): 0.064*\"fewer\" + 0.024*\"septemb\" + 0.021*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:19:58,198 : INFO : topic #17 (0.020): 0.062*\"church\" + 0.020*\"jpg\" + 0.020*\"fifteenth\" + 0.018*\"christian\" + 0.017*\"cathol\" + 0.017*\"bishop\" + 0.016*\"centuri\" + 0.015*\"retroflex\" + 0.013*\"italian\" + 0.013*\"sail\"\n", + "2019-01-31 
00:19:58,204 : INFO : topic diff=0.021961, rho=0.086387\n", + "2019-01-31 00:19:58,357 : INFO : PROGRESS: pass 0, at document #270000/4922894\n", + "2019-01-31 00:19:59,816 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:00,082 : INFO : topic #15 (0.020): 0.014*\"develop\" + 0.012*\"requir\" + 0.011*\"small\" + 0.010*\"cultur\" + 0.010*\"word\" + 0.009*\"organ\" + 0.009*\"student\" + 0.009*\"commun\" + 0.008*\"human\" + 0.008*\"socialist\"\n", + "2019-01-31 00:20:00,083 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.007*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"blue\" + 0.004*\"bewild\" + 0.004*\"litig\" + 0.004*\"christma\" + 0.003*\"dai\" + 0.003*\"introductori\"\n", + "2019-01-31 00:20:00,085 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.020*\"word\" + 0.016*\"new\" + 0.014*\"storag\" + 0.013*\"edit\" + 0.012*\"presid\" + 0.012*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:20:00,086 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.031*\"woman\" + 0.029*\"champion\" + 0.024*\"olymp\" + 0.024*\"medal\" + 0.023*\"event\" + 0.023*\"men\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.017*\"nation\"\n", + "2019-01-31 00:20:00,087 : INFO : topic #8 (0.020): 0.032*\"act\" + 0.030*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.014*\"ricardo\" + 0.014*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.007*\"justic\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:20:00,093 : INFO : topic diff=0.021281, rho=0.086066\n", + "2019-01-31 00:20:00,248 : INFO : PROGRESS: pass 0, at document #272000/4922894\n", + "2019-01-31 00:20:01,730 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:01,996 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.018*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"area\" + 0.014*\"mount\" + 0.009*\"foam\" + 0.008*\"land\" + 
0.008*\"north\" + 0.007*\"firm\" + 0.007*\"lobe\"\n", + "2019-01-31 00:20:01,997 : INFO : topic #35 (0.020): 0.046*\"russia\" + 0.034*\"sovereignti\" + 0.026*\"rural\" + 0.024*\"poison\" + 0.023*\"personifi\" + 0.023*\"reprint\" + 0.016*\"unfortun\" + 0.016*\"moscow\" + 0.015*\"malaysia\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:20:01,998 : INFO : topic #3 (0.020): 0.039*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.024*\"seri\" + 0.018*\"gener\" + 0.017*\"chickasaw\" + 0.017*\"member\" + 0.016*\"appeas\" + 0.015*\"serv\" + 0.012*\"gov\"\n", + "2019-01-31 00:20:01,999 : INFO : topic #42 (0.020): 0.037*\"german\" + 0.026*\"germani\" + 0.014*\"jewish\" + 0.013*\"israel\" + 0.011*\"vol\" + 0.011*\"der\" + 0.010*\"berlin\" + 0.009*\"greek\" + 0.008*\"austria\" + 0.008*\"europ\"\n", + "2019-01-31 00:20:02,000 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"john\" + 0.012*\"deal\" + 0.011*\"bone\"\n", + "2019-01-31 00:20:02,006 : INFO : topic diff=0.021751, rho=0.085749\n", + "2019-01-31 00:20:02,164 : INFO : PROGRESS: pass 0, at document #274000/4922894\n", + "2019-01-31 00:20:03,647 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:03,912 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"southern\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"cytokin\" + 0.006*\"servitud\" + 0.006*\"measur\"\n", + "2019-01-31 00:20:03,914 : INFO : topic #47 (0.020): 0.069*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:20:03,915 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.029*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.015*\"loui\" + 0.014*\"lazi\" + 
0.013*\"wreath\" + 0.011*\"piec\"\n", + "2019-01-31 00:20:03,916 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.031*\"woman\" + 0.029*\"champion\" + 0.024*\"olymp\" + 0.023*\"event\" + 0.023*\"medal\" + 0.023*\"men\" + 0.018*\"atheist\" + 0.018*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 00:20:03,917 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.025*\"new\" + 0.023*\"london\" + 0.023*\"australian\" + 0.021*\"england\" + 0.020*\"ireland\" + 0.017*\"british\" + 0.015*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 00:20:03,923 : INFO : topic diff=0.024724, rho=0.085436\n", + "2019-01-31 00:20:04,074 : INFO : PROGRESS: pass 0, at document #276000/4922894\n", + "2019-01-31 00:20:05,524 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:05,790 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"cytokin\" + 0.006*\"servitud\" + 0.006*\"measur\"\n", + "2019-01-31 00:20:05,791 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.011*\"start\" + 0.008*\"replac\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"summerhil\" + 0.006*\"new\" + 0.006*\"placement\"\n", + "2019-01-31 00:20:05,792 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.031*\"workplac\" + 0.028*\"champion\" + 0.023*\"event\" + 0.023*\"olymp\" + 0.023*\"men\" + 0.023*\"medal\" + 0.019*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 00:20:05,794 : INFO : topic #37 (0.020): 0.008*\"love\" + 0.007*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.005*\"blue\" + 0.004*\"christma\" + 0.004*\"sene\" + 0.004*\"bewild\" + 0.004*\"litig\" + 0.003*\"introductori\"\n", + "2019-01-31 00:20:05,794 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.043*\"new\" + 0.027*\"palmer\" + 0.027*\"year\" + 0.017*\"center\" + 0.016*\"strategist\" + 0.011*\"open\" + 0.009*\"hot\" + 
0.009*\"lobe\" + 0.009*\"includ\"\n", + "2019-01-31 00:20:05,800 : INFO : topic diff=0.023910, rho=0.085126\n", + "2019-01-31 00:20:05,955 : INFO : PROGRESS: pass 0, at document #278000/4922894\n", + "2019-01-31 00:20:07,413 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:07,679 : INFO : topic #17 (0.020): 0.063*\"church\" + 0.021*\"jpg\" + 0.019*\"fifteenth\" + 0.017*\"cathol\" + 0.017*\"bishop\" + 0.017*\"christian\" + 0.016*\"centuri\" + 0.015*\"retroflex\" + 0.012*\"italian\" + 0.012*\"sail\"\n", + "2019-01-31 00:20:07,681 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"disco\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:20:07,682 : INFO : topic #43 (0.020): 0.067*\"parti\" + 0.061*\"elect\" + 0.027*\"voluntari\" + 0.025*\"democrat\" + 0.022*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.015*\"tendenc\" + 0.015*\"report\" + 0.014*\"liber\"\n", + "2019-01-31 00:20:07,683 : INFO : topic #36 (0.020): 0.027*\"companhia\" + 0.010*\"develop\" + 0.009*\"serv\" + 0.009*\"market\" + 0.008*\"prognosi\" + 0.008*\"manag\" + 0.008*\"network\" + 0.008*\"produc\" + 0.008*\"oper\" + 0.008*\"includ\"\n", + "2019-01-31 00:20:07,684 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"john\" + 0.012*\"bone\"\n", + "2019-01-31 00:20:07,690 : INFO : topic diff=0.023322, rho=0.084819\n", + "2019-01-31 00:20:10,404 : INFO : -11.715 per-word bound, 3361.4 perplexity estimate based on a held-out corpus of 2000 documents with 523660 words\n", + "2019-01-31 00:20:10,405 : INFO : PROGRESS: pass 0, at document #280000/4922894\n", + "2019-01-31 00:20:11,850 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:12,116 : INFO : topic #10 
(0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"disco\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 00:20:12,117 : INFO : topic #42 (0.020): 0.038*\"german\" + 0.026*\"germani\" + 0.015*\"jewish\" + 0.013*\"vol\" + 0.012*\"israel\" + 0.012*\"der\" + 0.011*\"berlin\" + 0.011*\"greek\" + 0.009*\"austria\" + 0.008*\"albanian\"\n", + "2019-01-31 00:20:12,118 : INFO : topic #12 (0.020): 0.008*\"gener\" + 0.007*\"number\" + 0.007*\"frontal\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"cytokin\" + 0.006*\"servitud\"\n", + "2019-01-31 00:20:12,120 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.006*\"kill\" + 0.006*\"man\" + 0.006*\"sack\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.004*\"life\" + 0.004*\"help\"\n", + "2019-01-31 00:20:12,121 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.031*\"workplac\" + 0.029*\"champion\" + 0.024*\"olymp\" + 0.023*\"event\" + 0.023*\"medal\" + 0.023*\"men\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.017*\"nation\"\n", + "2019-01-31 00:20:12,128 : INFO : topic diff=0.020409, rho=0.084515\n", + "2019-01-31 00:20:12,285 : INFO : PROGRESS: pass 0, at document #282000/4922894\n", + "2019-01-31 00:20:13,753 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:14,020 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"disco\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:20:14,021 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.031*\"workplac\" + 0.029*\"champion\" + 0.024*\"olymp\" + 0.023*\"event\" + 0.023*\"medal\" + 0.022*\"men\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:20:14,022 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 
0.041*\"arsen\" + 0.040*\"line\" + 0.036*\"raid\" + 0.034*\"museo\" + 0.019*\"pain\" + 0.018*\"traceabl\" + 0.017*\"word\" + 0.017*\"serv\" + 0.015*\"artist\"\n", + "2019-01-31 00:20:14,024 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.017*\"taxpay\" + 0.016*\"candid\" + 0.015*\"tornado\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"théori\" + 0.010*\"landslid\" + 0.010*\"ret\"\n", + "2019-01-31 00:20:14,025 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.011*\"televis\" + 0.010*\"pakistan\" + 0.010*\"khalsa\" + 0.010*\"singh\" + 0.010*\"alam\" + 0.010*\"start\" + 0.009*\"muskoge\"\n", + "2019-01-31 00:20:14,031 : INFO : topic diff=0.023625, rho=0.084215\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:20:14,185 : INFO : PROGRESS: pass 0, at document #284000/4922894\n", + "2019-01-31 00:20:15,655 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:15,920 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"bone\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 00:20:15,922 : INFO : topic #42 (0.020): 0.039*\"german\" + 0.026*\"germani\" + 0.015*\"jewish\" + 0.012*\"vol\" + 0.012*\"israel\" + 0.011*\"der\" + 0.011*\"berlin\" + 0.010*\"greek\" + 0.009*\"jeremiah\" + 0.008*\"austria\"\n", + "2019-01-31 00:20:15,923 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.043*\"new\" + 0.026*\"palmer\" + 0.026*\"year\" + 0.016*\"center\" + 0.016*\"strategist\" + 0.011*\"open\" + 0.010*\"hot\" + 0.009*\"includ\" + 0.009*\"lobe\"\n", + "2019-01-31 00:20:15,924 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.040*\"arsen\" + 0.040*\"line\" + 0.037*\"raid\" + 0.034*\"museo\" + 0.019*\"pain\" + 0.018*\"traceabl\" + 0.017*\"word\" + 0.017*\"serv\" + 0.015*\"artist\"\n", + "2019-01-31 00:20:15,925 : INFO : topic #5 
(0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.028*\"reconstruct\" + 0.023*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:20:15,931 : INFO : topic diff=0.020654, rho=0.083918\n", + "2019-01-31 00:20:16,141 : INFO : PROGRESS: pass 0, at document #286000/4922894\n", + "2019-01-31 00:20:17,634 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:17,900 : INFO : topic #47 (0.020): 0.068*\"muscl\" + 0.037*\"perceptu\" + 0.022*\"damn\" + 0.019*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.015*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:20:17,902 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.016*\"candid\" + 0.016*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"landslid\" + 0.010*\"théori\" + 0.009*\"poti\"\n", + "2019-01-31 00:20:17,903 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.030*\"incumb\" + 0.012*\"islam\" + 0.011*\"televis\" + 0.010*\"pakistan\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.010*\"singh\" + 0.010*\"start\" + 0.009*\"muskoge\"\n", + "2019-01-31 00:20:17,904 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.006*\"disco\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"activ\" + 0.006*\"treat\" + 0.006*\"have\"\n", + "2019-01-31 00:20:17,906 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.038*\"cotton\" + 0.029*\"unionist\" + 0.021*\"american\" + 0.016*\"new\" + 0.016*\"terri\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.012*\"north\" + 0.011*\"violent\"\n", + "2019-01-31 00:20:17,911 : INFO : topic diff=0.021162, rho=0.083624\n", + "2019-01-31 00:20:18,069 : INFO : PROGRESS: pass 0, at document #288000/4922894\n", + "2019-01-31 00:20:19,563 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:19,832 
: INFO : topic #35 (0.020): 0.051*\"russia\" + 0.035*\"sovereignti\" + 0.028*\"rural\" + 0.024*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.017*\"moscow\" + 0.016*\"unfortun\" + 0.015*\"tyrant\" + 0.014*\"poland\"\n", + "2019-01-31 00:20:19,833 : INFO : topic #38 (0.020): 0.020*\"walter\" + 0.015*\"king\" + 0.011*\"aza\" + 0.010*\"battalion\" + 0.010*\"teufel\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.007*\"till\" + 0.007*\"centuri\" + 0.007*\"embassi\"\n", + "2019-01-31 00:20:19,834 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.028*\"reconstruct\" + 0.028*\"rel\" + 0.023*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:20:19,835 : INFO : topic #15 (0.020): 0.015*\"develop\" + 0.012*\"requir\" + 0.011*\"small\" + 0.010*\"word\" + 0.010*\"organ\" + 0.010*\"cultur\" + 0.009*\"student\" + 0.009*\"commun\" + 0.008*\"socialist\" + 0.007*\"human\"\n", + "2019-01-31 00:20:19,837 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.063*\"parti\" + 0.026*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.015*\"report\" + 0.015*\"bypass\" + 0.014*\"liber\"\n", + "2019-01-31 00:20:19,843 : INFO : topic diff=0.021270, rho=0.083333\n", + "2019-01-31 00:20:19,997 : INFO : PROGRESS: pass 0, at document #290000/4922894\n", + "2019-01-31 00:20:21,444 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:21,710 : INFO : topic #20 (0.020): 0.129*\"scholar\" + 0.036*\"struggl\" + 0.032*\"high\" + 0.028*\"educ\" + 0.018*\"yawn\" + 0.017*\"collector\" + 0.013*\"prognosi\" + 0.011*\"class\" + 0.009*\"task\" + 0.009*\"pseudo\"\n", + "2019-01-31 00:20:21,711 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"bone\" + 0.011*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 00:20:21,712 : INFO : 
topic #23 (0.020): 0.131*\"audit\" + 0.068*\"best\" + 0.031*\"jacksonvil\" + 0.029*\"yawn\" + 0.029*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:20:21,713 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.020*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.012*\"storag\" + 0.012*\"presid\" + 0.012*\"worldwid\" + 0.011*\"nicola\" + 0.010*\"magazin\"\n", + "2019-01-31 00:20:21,714 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"london\" + 0.023*\"australian\" + 0.021*\"england\" + 0.021*\"ireland\" + 0.017*\"youth\" + 0.017*\"british\" + 0.015*\"wale\"\n", + "2019-01-31 00:20:21,720 : INFO : topic diff=0.021206, rho=0.083045\n", + "2019-01-31 00:20:21,872 : INFO : PROGRESS: pass 0, at document #292000/4922894\n", + "2019-01-31 00:20:23,337 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:23,604 : INFO : topic #48 (0.020): 0.077*\"octob\" + 0.077*\"march\" + 0.077*\"sens\" + 0.075*\"januari\" + 0.072*\"notion\" + 0.069*\"august\" + 0.068*\"juli\" + 0.067*\"decatur\" + 0.067*\"april\" + 0.067*\"judici\"\n", + "2019-01-31 00:20:23,605 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.046*\"american\" + 0.026*\"valour\" + 0.019*\"player\" + 0.019*\"english\" + 0.018*\"folei\" + 0.016*\"polit\" + 0.015*\"dutch\" + 0.013*\"simpler\" + 0.013*\"acrimoni\"\n", + "2019-01-31 00:20:23,606 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.060*\"parti\" + 0.027*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.015*\"report\" + 0.015*\"bypass\" + 0.014*\"liber\"\n", + "2019-01-31 00:20:23,608 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.028*\"reconstruct\" + 0.028*\"rel\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:20:23,609 : INFO : topic 
#13 (0.020): 0.029*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"ireland\" + 0.017*\"youth\" + 0.017*\"british\" + 0.015*\"wale\"\n", + "2019-01-31 00:20:23,614 : INFO : topic diff=0.021090, rho=0.082761\n", + "2019-01-31 00:20:23,770 : INFO : PROGRESS: pass 0, at document #294000/4922894\n", + "2019-01-31 00:20:25,228 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:25,493 : INFO : topic #23 (0.020): 0.130*\"audit\" + 0.066*\"best\" + 0.032*\"jacksonvil\" + 0.031*\"yawn\" + 0.028*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:20:25,495 : INFO : topic #39 (0.020): 0.031*\"taxpay\" + 0.027*\"canada\" + 0.025*\"scientist\" + 0.022*\"clot\" + 0.022*\"canadian\" + 0.016*\"basketbal\" + 0.015*\"hoar\" + 0.015*\"confer\" + 0.013*\"toronto\" + 0.011*\"ontario\"\n", + "2019-01-31 00:20:25,496 : INFO : topic #8 (0.020): 0.031*\"law\" + 0.026*\"cortic\" + 0.026*\"act\" + 0.019*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"justic\"\n", + "2019-01-31 00:20:25,498 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.017*\"candid\" + 0.017*\"taxpay\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.010*\"théori\" + 0.010*\"ret\" + 0.010*\"landslid\"\n", + "2019-01-31 00:20:25,499 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.014*\"mount\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.008*\"palmer\"\n", + "2019-01-31 00:20:25,505 : INFO : topic diff=0.020925, rho=0.082479\n", + "2019-01-31 00:20:25,662 : INFO : PROGRESS: pass 0, at document #296000/4922894\n", + "2019-01-31 00:20:27,130 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": 
"stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:20:27,399 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"area\" + 0.014*\"mount\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.007*\"palmer\"\n", + "2019-01-31 00:20:27,400 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.017*\"taxpay\" + 0.017*\"candid\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"théori\" + 0.010*\"landslid\" + 0.010*\"ret\"\n", + "2019-01-31 00:20:27,402 : INFO : topic #31 (0.020): 0.066*\"fusiform\" + 0.026*\"player\" + 0.021*\"place\" + 0.018*\"scientist\" + 0.016*\"taxpay\" + 0.011*\"leagu\" + 0.011*\"folei\" + 0.009*\"yard\" + 0.009*\"ruler\" + 0.008*\"yawn\"\n", + "2019-01-31 00:20:27,403 : INFO : topic #23 (0.020): 0.132*\"audit\" + 0.065*\"best\" + 0.032*\"jacksonvil\" + 0.030*\"yawn\" + 0.028*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:20:27,404 : INFO : topic #1 (0.020): 0.058*\"china\" + 0.053*\"chilton\" + 0.026*\"hong\" + 0.024*\"kong\" + 0.022*\"korean\" + 0.022*\"korea\" + 0.017*\"sourc\" + 0.017*\"leah\" + 0.014*\"kim\" + 0.012*\"levinson\"\n", + "2019-01-31 00:20:27,410 : INFO : topic diff=0.019476, rho=0.082199\n", + "2019-01-31 00:20:27,566 : INFO : PROGRESS: pass 0, at document #298000/4922894\n", + "2019-01-31 00:20:29,018 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:29,284 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.018*\"candid\" + 0.017*\"taxpay\" + 0.014*\"driver\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"théori\" + 0.011*\"find\" + 0.010*\"landslid\" + 0.009*\"ret\"\n", + "2019-01-31 00:20:29,286 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.061*\"parti\" + 0.026*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.019*\"polici\" + 0.016*\"republ\" + 0.015*\"bypass\" + 
0.015*\"report\" + 0.014*\"seaport\"\n", + "2019-01-31 00:20:29,287 : INFO : topic #19 (0.020): 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"charact\" + 0.008*\"form\" + 0.008*\"languag\" + 0.008*\"god\" + 0.008*\"like\" + 0.008*\"uruguayan\" + 0.007*\"mean\" + 0.006*\"differ\"\n", + "2019-01-31 00:20:29,288 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.010*\"start\" + 0.008*\"replac\" + 0.007*\"yawn\" + 0.007*\"countri\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"new\" + 0.006*\"théori\" + 0.006*\"summerhil\"\n", + "2019-01-31 00:20:29,289 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.076*\"januari\" + 0.072*\"notion\" + 0.071*\"juli\" + 0.070*\"august\" + 0.069*\"judici\" + 0.069*\"april\" + 0.069*\"decatur\"\n", + "2019-01-31 00:20:29,295 : INFO : topic diff=0.020832, rho=0.081923\n", + "2019-01-31 00:20:32,087 : INFO : -11.414 per-word bound, 2728.1 perplexity estimate based on a held-out corpus of 2000 documents with 555698 words\n", + "2019-01-31 00:20:32,087 : INFO : PROGRESS: pass 0, at document #300000/4922894\n", + "2019-01-31 00:20:33,558 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:33,824 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.040*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"crew\"\n", + "2019-01-31 00:20:33,826 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.029*\"woman\" + 0.026*\"olymp\" + 0.023*\"medal\" + 0.022*\"men\" + 0.021*\"atheist\" + 0.021*\"event\" + 0.018*\"alic\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:20:33,827 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"man\" + 0.005*\"night\" + 0.004*\"blue\" + 0.004*\"bewild\" + 0.004*\"litig\" + 0.003*\"vision\" + 0.003*\"christma\" + 0.003*\"dai\"\n", + "2019-01-31 00:20:33,828 : INFO : topic #3 (0.020): 0.040*\"present\" + 
0.029*\"offic\" + 0.026*\"minist\" + 0.022*\"seri\" + 0.019*\"gener\" + 0.017*\"member\" + 0.017*\"chickasaw\" + 0.016*\"serv\" + 0.015*\"appeas\" + 0.013*\"govern\"\n", + "2019-01-31 00:20:33,829 : INFO : topic #17 (0.020): 0.062*\"church\" + 0.021*\"jpg\" + 0.020*\"christian\" + 0.020*\"cathol\" + 0.018*\"bishop\" + 0.018*\"fifteenth\" + 0.015*\"centuri\" + 0.014*\"retroflex\" + 0.013*\"sail\" + 0.012*\"italian\"\n", + "2019-01-31 00:20:33,835 : INFO : topic diff=0.020513, rho=0.081650\n", + "2019-01-31 00:20:33,993 : INFO : PROGRESS: pass 0, at document #302000/4922894\n", + "2019-01-31 00:20:35,473 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:35,740 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.020*\"word\" + 0.016*\"new\" + 0.015*\"edit\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.012*\"presid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 00:20:35,741 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"man\" + 0.005*\"blue\" + 0.005*\"night\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.003*\"vision\" + 0.003*\"dai\" + 0.003*\"introductori\"\n", + "2019-01-31 00:20:35,742 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"area\" + 0.015*\"mount\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"foam\" + 0.008*\"palmer\"\n", + "2019-01-31 00:20:35,743 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.025*\"sail\" + 0.022*\"jean\" + 0.015*\"daphn\" + 0.012*\"loui\" + 0.012*\"lazi\" + 0.012*\"wine\" + 0.011*\"wreath\"\n", + "2019-01-31 00:20:35,744 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"soviet\" + 0.014*\"francisco\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"josé\"\n", + "2019-01-31 00:20:35,750 : INFO : topic diff=0.018847, rho=0.081379\n", + "2019-01-31 00:20:35,904 : INFO : 
PROGRESS: pass 0, at document #304000/4922894\n", + "2019-01-31 00:20:37,362 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:37,628 : INFO : topic #48 (0.020): 0.087*\"januari\" + 0.084*\"march\" + 0.077*\"sens\" + 0.077*\"octob\" + 0.073*\"notion\" + 0.071*\"judici\" + 0.071*\"juli\" + 0.070*\"august\" + 0.068*\"april\" + 0.068*\"decatur\"\n", + "2019-01-31 00:20:37,630 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.018*\"candid\" + 0.017*\"taxpay\" + 0.014*\"driver\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"find\" + 0.011*\"landslid\" + 0.010*\"théori\" + 0.010*\"ret\"\n", + "2019-01-31 00:20:37,631 : INFO : topic #45 (0.020): 0.023*\"black\" + 0.018*\"western\" + 0.016*\"colder\" + 0.013*\"record\" + 0.012*\"fit\" + 0.011*\"blind\" + 0.010*\"light\" + 0.008*\"green\" + 0.008*\"illicit\" + 0.006*\"hand\"\n", + "2019-01-31 00:20:37,633 : INFO : topic #17 (0.020): 0.062*\"church\" + 0.020*\"jpg\" + 0.020*\"christian\" + 0.019*\"cathol\" + 0.017*\"fifteenth\" + 0.017*\"bishop\" + 0.015*\"centuri\" + 0.014*\"retroflex\" + 0.013*\"sail\" + 0.011*\"italian\"\n", + "2019-01-31 00:20:37,634 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.014*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.010*\"slur\" + 0.009*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:20:37,639 : INFO : topic diff=0.019128, rho=0.081111\n", + "2019-01-31 00:20:37,790 : INFO : PROGRESS: pass 0, at document #306000/4922894\n", + "2019-01-31 00:20:39,230 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:39,496 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.043*\"american\" + 0.026*\"valour\" + 0.022*\"player\" + 0.018*\"english\" + 0.017*\"folei\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:20:39,497 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 
0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"differ\" + 0.006*\"measur\"\n", + "2019-01-31 00:20:39,499 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.032*\"sovereignti\" + 0.028*\"poison\" + 0.027*\"rural\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.018*\"poland\" + 0.016*\"moscow\" + 0.014*\"shirin\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:20:39,500 : INFO : topic #3 (0.020): 0.040*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.022*\"seri\" + 0.018*\"gener\" + 0.018*\"member\" + 0.018*\"chickasaw\" + 0.016*\"serv\" + 0.015*\"appeas\" + 0.013*\"govern\"\n", + "2019-01-31 00:20:39,501 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.041*\"cotton\" + 0.029*\"unionist\" + 0.022*\"american\" + 0.018*\"new\" + 0.015*\"terri\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"violent\"\n", + "2019-01-31 00:20:39,507 : INFO : topic diff=0.021513, rho=0.080845\n", + "2019-01-31 00:20:39,665 : INFO : PROGRESS: pass 0, at document #308000/4922894\n", + "2019-01-31 00:20:41,152 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:41,418 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.018*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"palmer\" + 0.008*\"foam\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:20:41,419 : INFO : topic #5 (0.020): 0.041*\"abroad\" + 0.029*\"son\" + 0.029*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 00:20:41,420 : INFO : topic #16 (0.020): 0.029*\"priest\" + 0.019*\"maria\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.018*\"king\" + 0.017*\"quarterli\" + 0.014*\"rotterdam\" + 0.014*\"portugues\" + 0.014*\"order\" + 0.012*\"princ\"\n", + "2019-01-31 
00:20:41,421 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.010*\"slur\" + 0.009*\"mexican–american\" + 0.009*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:20:41,422 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"differ\" + 0.006*\"measur\"\n", + "2019-01-31 00:20:41,428 : INFO : topic diff=0.020493, rho=0.080582\n", + "2019-01-31 00:20:41,578 : INFO : PROGRESS: pass 0, at document #310000/4922894\n", + "2019-01-31 00:20:43,012 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:43,278 : INFO : topic #31 (0.020): 0.066*\"fusiform\" + 0.023*\"player\" + 0.020*\"scientist\" + 0.019*\"place\" + 0.015*\"taxpay\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.010*\"folei\" + 0.009*\"yard\" + 0.008*\"barber\"\n", + "2019-01-31 00:20:43,279 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"man\" + 0.005*\"bewild\" + 0.005*\"blue\" + 0.004*\"night\" + 0.004*\"litig\" + 0.003*\"dai\" + 0.003*\"introductori\" + 0.003*\"vision\"\n", + "2019-01-31 00:20:43,280 : INFO : topic #3 (0.020): 0.039*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.023*\"seri\" + 0.019*\"chickasaw\" + 0.018*\"member\" + 0.018*\"gener\" + 0.016*\"serv\" + 0.015*\"appeas\" + 0.014*\"govern\"\n", + "2019-01-31 00:20:43,282 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.007*\"proper\" + 0.007*\"hormon\" + 0.007*\"disco\" + 0.006*\"caus\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"activ\"\n", + "2019-01-31 00:20:43,283 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.033*\"leagu\" + 0.031*\"place\" + 0.029*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:20:43,289 : INFO : 
topic diff=0.020996, rho=0.080322\n", + "2019-01-31 00:20:43,438 : INFO : PROGRESS: pass 0, at document #312000/4922894\n", + "2019-01-31 00:20:44,875 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:45,140 : INFO : topic #16 (0.020): 0.028*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.018*\"maria\" + 0.018*\"quarterli\" + 0.017*\"king\" + 0.015*\"rotterdam\" + 0.015*\"order\" + 0.015*\"portugues\" + 0.011*\"portrait\"\n", + "2019-01-31 00:20:45,141 : INFO : topic #20 (0.020): 0.127*\"scholar\" + 0.036*\"struggl\" + 0.029*\"educ\" + 0.029*\"high\" + 0.018*\"yawn\" + 0.017*\"collector\" + 0.012*\"prognosi\" + 0.009*\"class\" + 0.009*\"task\" + 0.008*\"pseudo\"\n", + "2019-01-31 00:20:45,143 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.031*\"sovereignti\" + 0.028*\"rural\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.022*\"personifi\" + 0.017*\"poland\" + 0.017*\"moscow\" + 0.015*\"shirin\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:20:45,144 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.023*\"player\" + 0.020*\"place\" + 0.020*\"scientist\" + 0.015*\"taxpay\" + 0.012*\"leagu\" + 0.011*\"yard\" + 0.010*\"ruler\" + 0.009*\"folei\" + 0.008*\"barber\"\n", + "2019-01-31 00:20:45,145 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.028*\"new\" + 0.025*\"sourc\" + 0.023*\"london\" + 0.021*\"australian\" + 0.021*\"england\" + 0.020*\"ireland\" + 0.018*\"youth\" + 0.017*\"british\" + 0.016*\"sydnei\"\n", + "2019-01-31 00:20:45,151 : INFO : topic diff=0.021081, rho=0.080064\n", + "2019-01-31 00:20:45,303 : INFO : PROGRESS: pass 0, at document #314000/4922894\n", + "2019-01-31 00:20:46,759 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:47,025 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.017*\"taxpay\" + 0.017*\"candid\" + 0.016*\"driver\" + 0.013*\"tornado\" + 0.013*\"ret\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"théori\" + 
0.010*\"champion\"\n", + "2019-01-31 00:20:47,026 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.030*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 00:20:47,027 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.031*\"place\" + 0.029*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:20:47,029 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.032*\"incumb\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"islam\" + 0.010*\"khalsa\" + 0.010*\"sri\" + 0.010*\"start\" + 0.009*\"alam\" + 0.009*\"muskoge\"\n", + "2019-01-31 00:20:47,030 : INFO : topic #9 (0.020): 0.081*\"bone\" + 0.046*\"american\" + 0.024*\"valour\" + 0.021*\"player\" + 0.016*\"folei\" + 0.016*\"english\" + 0.015*\"polit\" + 0.015*\"dutch\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 00:20:47,036 : INFO : topic diff=0.019141, rho=0.079809\n", + "2019-01-31 00:20:47,187 : INFO : PROGRESS: pass 0, at document #316000/4922894\n", + "2019-01-31 00:20:48,626 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:48,891 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.014*\"mount\" + 0.008*\"vacant\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 00:20:48,893 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.023*\"player\" + 0.020*\"place\" + 0.020*\"scientist\" + 0.015*\"taxpay\" + 0.012*\"leagu\" + 0.011*\"yard\" + 0.010*\"ruler\" + 0.010*\"folei\" + 0.008*\"barber\"\n", + "2019-01-31 00:20:48,894 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.026*\"cortic\" + 0.022*\"act\" + 0.019*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"judaism\" + 0.007*\"justic\"\n", 
+ "2019-01-31 00:20:48,895 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.020*\"mexico\" + 0.019*\"del\" + 0.014*\"soviet\" + 0.013*\"francisco\" + 0.013*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"lizard\"\n", + "2019-01-31 00:20:48,897 : INFO : topic #48 (0.020): 0.087*\"march\" + 0.082*\"januari\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.075*\"notion\" + 0.073*\"juli\" + 0.073*\"judici\" + 0.072*\"august\" + 0.072*\"april\" + 0.070*\"decatur\"\n", + "2019-01-31 00:20:48,903 : INFO : topic diff=0.018112, rho=0.079556\n", + "2019-01-31 00:20:49,056 : INFO : PROGRESS: pass 0, at document #318000/4922894\n", + "2019-01-31 00:20:50,489 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:50,755 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.044*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.017*\"wine\" + 0.016*\"wreath\" + 0.015*\"daphn\" + 0.013*\"loui\" + 0.012*\"lazi\"\n", + "2019-01-31 00:20:50,756 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.020*\"mexico\" + 0.019*\"del\" + 0.014*\"soviet\" + 0.013*\"francisco\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"lizard\"\n", + "2019-01-31 00:20:50,757 : INFO : topic #19 (0.020): 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"charact\" + 0.009*\"form\" + 0.009*\"languag\" + 0.008*\"mean\" + 0.008*\"uruguayan\" + 0.008*\"like\" + 0.007*\"god\" + 0.006*\"differ\"\n", + "2019-01-31 00:20:50,758 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"new\" + 0.025*\"sourc\" + 0.024*\"london\" + 0.021*\"australian\" + 0.020*\"england\" + 0.020*\"ireland\" + 0.018*\"youth\" + 0.017*\"british\" + 0.015*\"sydnei\"\n", + "2019-01-31 00:20:50,760 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.031*\"champion\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.024*\"alic\" + 0.022*\"medal\" + 0.021*\"men\" + 0.021*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:20:50,765 : 
INFO : topic diff=0.018600, rho=0.079305\n", + "2019-01-31 00:20:53,587 : INFO : -11.562 per-word bound, 3022.6 perplexity estimate based on a held-out corpus of 2000 documents with 550871 words\n", + "2019-01-31 00:20:53,588 : INFO : PROGRESS: pass 0, at document #320000/4922894\n", + "2019-01-31 00:20:55,043 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:55,309 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.025*\"collector\" + 0.020*\"institut\" + 0.019*\"schuster\" + 0.016*\"student\" + 0.016*\"requir\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:20:55,310 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.044*\"arsen\" + 0.038*\"line\" + 0.037*\"raid\" + 0.035*\"museo\" + 0.018*\"traceabl\" + 0.018*\"pain\" + 0.017*\"serv\" + 0.017*\"word\" + 0.017*\"exhaust\"\n", + "2019-01-31 00:20:55,311 : INFO : topic #8 (0.020): 0.033*\"law\" + 0.027*\"cortic\" + 0.022*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"legal\" + 0.009*\"polaris\" + 0.009*\"judaism\" + 0.008*\"justic\"\n", + "2019-01-31 00:20:55,312 : INFO : topic #15 (0.020): 0.014*\"develop\" + 0.013*\"small\" + 0.012*\"requir\" + 0.010*\"organ\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"student\" + 0.008*\"socialist\" + 0.008*\"human\"\n", + "2019-01-31 00:20:55,313 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.023*\"adulthood\" + 0.017*\"hostil\" + 0.017*\"feel\" + 0.015*\"male\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.009*\"popolo\"\n", + "2019-01-31 00:20:55,319 : INFO : topic diff=0.017851, rho=0.079057\n", + "2019-01-31 00:20:55,474 : INFO : PROGRESS: pass 0, at document #322000/4922894\n", + "2019-01-31 00:20:56,926 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:57,192 : INFO : topic 
#7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.012*\"life\" + 0.012*\"deal\" + 0.012*\"bone\" + 0.012*\"faster\" + 0.012*\"john\"\n", + "2019-01-31 00:20:57,193 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.043*\"franc\" + 0.028*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.016*\"wine\" + 0.015*\"wreath\" + 0.014*\"daphn\" + 0.013*\"loui\" + 0.012*\"lazi\"\n", + "2019-01-31 00:20:57,194 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.042*\"new\" + 0.027*\"palmer\" + 0.025*\"year\" + 0.015*\"center\" + 0.015*\"strategist\" + 0.010*\"open\" + 0.009*\"hot\" + 0.009*\"lobe\" + 0.009*\"includ\"\n", + "2019-01-31 00:20:57,195 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.010*\"start\" + 0.008*\"replac\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"new\" + 0.006*\"théori\" + 0.006*\"summerhil\"\n", + "2019-01-31 00:20:57,197 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.031*\"incumb\" + 0.015*\"televis\" + 0.012*\"pakistan\" + 0.010*\"islam\" + 0.010*\"khalsa\" + 0.010*\"start\" + 0.009*\"sri\" + 0.009*\"tajikistan\" + 0.009*\"alam\"\n", + "2019-01-31 00:20:57,202 : INFO : topic diff=0.019380, rho=0.078811\n", + "2019-01-31 00:20:57,359 : INFO : PROGRESS: pass 0, at document #324000/4922894\n", + "2019-01-31 00:20:58,818 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:20:59,084 : INFO : topic #26 (0.020): 0.034*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.023*\"alic\" + 0.021*\"medal\" + 0.021*\"event\" + 0.020*\"men\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 00:20:59,085 : INFO : topic #45 (0.020): 0.022*\"black\" + 0.018*\"western\" + 0.015*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.010*\"light\" + 0.009*\"fit\" + 0.008*\"illicit\" + 0.008*\"green\" + 0.007*\"arm\"\n", + "2019-01-31 00:20:59,086 : INFO : topic #48 (0.020): 0.083*\"march\" + 0.080*\"januari\" + 
0.076*\"octob\" + 0.076*\"sens\" + 0.073*\"notion\" + 0.072*\"april\" + 0.071*\"juli\" + 0.071*\"judici\" + 0.071*\"august\" + 0.069*\"decatur\"\n", + "2019-01-31 00:20:59,087 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.023*\"seri\" + 0.019*\"gener\" + 0.019*\"chickasaw\" + 0.018*\"member\" + 0.015*\"serv\" + 0.015*\"appeas\" + 0.014*\"govern\"\n", + "2019-01-31 00:20:59,088 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.014*\"yawn\" + 0.014*\"margin\" + 0.012*\"deal\" + 0.012*\"life\" + 0.012*\"john\" + 0.012*\"bone\" + 0.012*\"faster\"\n", + "2019-01-31 00:20:59,094 : INFO : topic diff=0.020038, rho=0.078567\n", + "2019-01-31 00:20:59,250 : INFO : PROGRESS: pass 0, at document #326000/4922894\n", + "2019-01-31 00:21:00,726 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:00,991 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.026*\"collector\" + 0.020*\"institut\" + 0.019*\"schuster\" + 0.016*\"student\" + 0.015*\"requir\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.012*\"degre\"\n", + "2019-01-31 00:21:00,993 : INFO : topic #26 (0.020): 0.035*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.021*\"event\" + 0.020*\"men\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:21:00,994 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.023*\"hous\" + 0.023*\"rivièr\" + 0.016*\"buford\" + 0.012*\"rosenwald\" + 0.011*\"briarwood\" + 0.011*\"histor\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"silicon\"\n", + "2019-01-31 00:21:00,995 : INFO : topic #3 (0.020): 0.039*\"present\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.023*\"seri\" + 0.019*\"gener\" + 0.018*\"chickasaw\" + 0.018*\"member\" + 0.015*\"serv\" + 0.015*\"appeas\" + 0.014*\"govern\"\n", + "2019-01-31 00:21:00,996 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.043*\"franc\" + 
0.028*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.015*\"wine\" + 0.015*\"loui\" + 0.014*\"daphn\" + 0.013*\"wreath\" + 0.013*\"lazi\"\n", + "2019-01-31 00:21:01,002 : INFO : topic diff=0.018567, rho=0.078326\n", + "2019-01-31 00:21:01,154 : INFO : PROGRESS: pass 0, at document #328000/4922894\n", + "2019-01-31 00:21:02,594 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:02,860 : INFO : topic #42 (0.020): 0.038*\"german\" + 0.025*\"germani\" + 0.014*\"vol\" + 0.012*\"jewish\" + 0.012*\"der\" + 0.011*\"israel\" + 0.010*\"berlin\" + 0.009*\"greek\" + 0.008*\"austria\" + 0.008*\"europ\"\n", + "2019-01-31 00:21:02,861 : INFO : topic #41 (0.020): 0.051*\"citi\" + 0.042*\"new\" + 0.027*\"palmer\" + 0.024*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.010*\"open\" + 0.010*\"lobe\" + 0.009*\"includ\" + 0.009*\"hot\"\n", + "2019-01-31 00:21:02,862 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.024*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.013*\"francisco\" + 0.011*\"josé\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 00:21:02,863 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.025*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"rudolf\"\n", + "2019-01-31 00:21:02,864 : INFO : topic #16 (0.020): 0.028*\"priest\" + 0.019*\"quarterli\" + 0.019*\"grammat\" + 0.018*\"king\" + 0.018*\"duke\" + 0.018*\"portugues\" + 0.017*\"maria\" + 0.015*\"rotterdam\" + 0.013*\"princ\" + 0.012*\"portrait\"\n", + "2019-01-31 00:21:02,870 : INFO : topic diff=0.016826, rho=0.078087\n", + "2019-01-31 00:21:03,027 : INFO : PROGRESS: pass 0, at document #330000/4922894\n", + "2019-01-31 00:21:04,504 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:04,770 : INFO : topic #15 (0.020): 0.014*\"small\" + 0.013*\"develop\" + 
0.011*\"organ\" + 0.011*\"requir\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"socialist\" + 0.008*\"student\" + 0.008*\"human\"\n", + "2019-01-31 00:21:04,771 : INFO : topic #17 (0.020): 0.065*\"church\" + 0.019*\"jpg\" + 0.019*\"christian\" + 0.018*\"cathol\" + 0.017*\"bishop\" + 0.014*\"sail\" + 0.014*\"fifteenth\" + 0.014*\"retroflex\" + 0.014*\"centuri\" + 0.010*\"italian\"\n", + "2019-01-31 00:21:04,772 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.043*\"franc\" + 0.029*\"pari\" + 0.026*\"sail\" + 0.022*\"jean\" + 0.015*\"loui\" + 0.014*\"daphn\" + 0.014*\"wine\" + 0.013*\"lazi\" + 0.012*\"piec\"\n", + "2019-01-31 00:21:04,774 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"taxpay\" + 0.016*\"candid\" + 0.014*\"driver\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.011*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"théori\"\n", + "2019-01-31 00:21:04,775 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"area\" + 0.015*\"mount\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\" + 0.008*\"lobe\" + 0.008*\"foam\"\n", + "2019-01-31 00:21:04,781 : INFO : topic diff=0.019237, rho=0.077850\n", + "2019-01-31 00:21:04,933 : INFO : PROGRESS: pass 0, at document #332000/4922894\n", + "2019-01-31 00:21:06,383 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:06,655 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.043*\"franc\" + 0.028*\"pari\" + 0.025*\"sail\" + 0.022*\"wine\" + 0.022*\"jean\" + 0.014*\"daphn\" + 0.014*\"loui\" + 0.012*\"lazi\" + 0.011*\"piec\"\n", + "2019-01-31 00:21:06,656 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.030*\"incumb\" + 0.014*\"televis\" + 0.012*\"pakistan\" + 0.010*\"islam\" + 0.010*\"start\" + 0.010*\"khalsa\" + 0.009*\"tajikistan\" + 0.009*\"sri\" + 0.008*\"alam\"\n", + "2019-01-31 00:21:06,658 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.009*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 
0.007*\"pathwai\" + 0.007*\"che\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"treat\" + 0.006*\"includ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:21:06,659 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.027*\"factor\" + 0.023*\"adulthood\" + 0.017*\"hostil\" + 0.017*\"feel\" + 0.015*\"live\" + 0.014*\"male\" + 0.011*\"plaisir\" + 0.009*\"genu\" + 0.009*\"popolo\"\n", + "2019-01-31 00:21:06,660 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.026*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"justic\"\n", + "2019-01-31 00:21:06,666 : INFO : topic diff=0.018647, rho=0.077615\n", + "2019-01-31 00:21:06,820 : INFO : PROGRESS: pass 0, at document #334000/4922894\n", + "2019-01-31 00:21:08,282 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:08,547 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.010*\"start\" + 0.008*\"replac\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.007*\"million\" + 0.006*\"nation\" + 0.006*\"théori\" + 0.006*\"new\" + 0.006*\"placement\"\n", + "2019-01-31 00:21:08,549 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.027*\"factor\" + 0.023*\"adulthood\" + 0.017*\"hostil\" + 0.017*\"feel\" + 0.015*\"live\" + 0.015*\"male\" + 0.011*\"plaisir\" + 0.010*\"popolo\" + 0.009*\"genu\"\n", + "2019-01-31 00:21:08,550 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.042*\"franc\" + 0.029*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.021*\"wine\" + 0.014*\"daphn\" + 0.014*\"loui\" + 0.012*\"lazi\" + 0.011*\"piec\"\n", + "2019-01-31 00:21:08,551 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.017*\"champion\" + 0.015*\"taxpay\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"martin\" + 0.012*\"poet\"\n", + "2019-01-31 00:21:08,553 : INFO : topic #23 (0.020): 0.124*\"audit\" + 0.065*\"best\" + 
0.039*\"jacksonvil\" + 0.030*\"yawn\" + 0.025*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.016*\"tokyo\"\n", + "2019-01-31 00:21:08,558 : INFO : topic diff=0.016786, rho=0.077382\n", + "2019-01-31 00:21:08,714 : INFO : PROGRESS: pass 0, at document #336000/4922894\n", + "2019-01-31 00:21:10,205 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:10,471 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.024*\"seri\" + 0.020*\"gener\" + 0.018*\"member\" + 0.018*\"chickasaw\" + 0.015*\"appeas\" + 0.014*\"govern\" + 0.014*\"serv\"\n", + "2019-01-31 00:21:10,472 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"che\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:21:10,474 : INFO : topic #43 (0.020): 0.069*\"elect\" + 0.057*\"parti\" + 0.027*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.019*\"polici\" + 0.015*\"bypass\" + 0.014*\"report\" + 0.014*\"republ\" + 0.013*\"hous\"\n", + "2019-01-31 00:21:10,475 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"arsen\" + 0.037*\"line\" + 0.037*\"raid\" + 0.032*\"museo\" + 0.018*\"traceabl\" + 0.017*\"serv\" + 0.017*\"pain\" + 0.016*\"word\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:21:10,475 : INFO : topic #16 (0.020): 0.026*\"priest\" + 0.019*\"grammat\" + 0.018*\"king\" + 0.018*\"portugues\" + 0.018*\"quarterli\" + 0.017*\"duke\" + 0.017*\"maria\" + 0.016*\"rotterdam\" + 0.013*\"portrait\" + 0.012*\"idiosyncrat\"\n", + "2019-01-31 00:21:10,481 : INFO : topic diff=0.020697, rho=0.077152\n", + "2019-01-31 00:21:10,638 : INFO : PROGRESS: pass 0, at document #338000/4922894\n", + "2019-01-31 00:21:12,117 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:12,383 : INFO : topic #26 (0.020): 0.035*\"workplac\" + 
0.032*\"champion\" + 0.031*\"woman\" + 0.025*\"event\" + 0.025*\"olymp\" + 0.021*\"alic\" + 0.021*\"men\" + 0.021*\"medal\" + 0.019*\"rainfal\" + 0.019*\"atheist\"\n", + "2019-01-31 00:21:12,384 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.014*\"televis\" + 0.011*\"pakistan\" + 0.010*\"islam\" + 0.010*\"khalsa\" + 0.009*\"sri\" + 0.009*\"start\" + 0.009*\"alam\" + 0.008*\"tajikistan\"\n", + "2019-01-31 00:21:12,385 : INFO : topic #31 (0.020): 0.063*\"fusiform\" + 0.022*\"player\" + 0.019*\"scientist\" + 0.019*\"place\" + 0.017*\"taxpay\" + 0.011*\"leagu\" + 0.011*\"folei\" + 0.010*\"yard\" + 0.009*\"borrow\" + 0.009*\"ruler\"\n", + "2019-01-31 00:21:12,386 : INFO : topic #16 (0.020): 0.028*\"priest\" + 0.019*\"king\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"portugues\" + 0.017*\"duke\" + 0.017*\"maria\" + 0.017*\"rotterdam\" + 0.013*\"princ\" + 0.012*\"idiosyncrat\"\n", + "2019-01-31 00:21:12,388 : INFO : topic #32 (0.020): 0.061*\"district\" + 0.046*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.030*\"cotton\" + 0.029*\"area\" + 0.027*\"multitud\" + 0.026*\"regim\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:21:12,394 : INFO : topic diff=0.017033, rho=0.076923\n", + "2019-01-31 00:21:15,197 : INFO : -11.816 per-word bound, 3606.0 perplexity estimate based on a held-out corpus of 2000 documents with 555866 words\n", + "2019-01-31 00:21:15,197 : INFO : PROGRESS: pass 0, at document #340000/4922894\n", + "2019-01-31 00:21:16,678 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:16,944 : INFO : topic #19 (0.020): 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"languag\" + 0.009*\"form\" + 0.009*\"charact\" + 0.008*\"mean\" + 0.008*\"uruguayan\" + 0.008*\"like\" + 0.006*\"god\" + 0.006*\"differ\"\n", + "2019-01-31 00:21:16,945 : INFO : topic #40 (0.020): 0.093*\"unit\" + 0.026*\"collector\" + 0.019*\"institut\" + 0.019*\"schuster\" + 0.016*\"student\" + 
0.014*\"requir\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:21:16,946 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"arsen\" + 0.038*\"raid\" + 0.038*\"line\" + 0.031*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.016*\"pain\" + 0.016*\"word\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:21:16,947 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.017*\"champion\" + 0.015*\"tiepolo\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.013*\"martin\" + 0.012*\"winner\"\n", + "2019-01-31 00:21:16,948 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.027*\"factor\" + 0.023*\"adulthood\" + 0.017*\"hostil\" + 0.017*\"feel\" + 0.015*\"live\" + 0.015*\"male\" + 0.011*\"plaisir\" + 0.010*\"popolo\" + 0.010*\"genu\"\n", + "2019-01-31 00:21:16,954 : INFO : topic diff=0.017131, rho=0.076696\n", + "2019-01-31 00:21:17,112 : INFO : PROGRESS: pass 0, at document #342000/4922894\n", + "2019-01-31 00:21:18,579 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:18,846 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"dai\" + 0.004*\"help\" + 0.004*\"deal\" + 0.004*\"fraud\"\n", + "2019-01-31 00:21:18,848 : INFO : topic #43 (0.020): 0.069*\"elect\" + 0.058*\"parti\" + 0.027*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.020*\"polici\" + 0.015*\"bypass\" + 0.014*\"report\" + 0.014*\"republ\" + 0.013*\"seaport\"\n", + "2019-01-31 00:21:18,849 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.022*\"rivièr\" + 0.016*\"buford\" + 0.012*\"rosenwald\" + 0.012*\"briarwood\" + 0.011*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.009*\"linear\"\n", + "2019-01-31 00:21:18,850 : INFO : topic #41 (0.020): 0.050*\"citi\" + 0.042*\"new\" + 0.025*\"palmer\" + 0.023*\"year\" + 0.015*\"strategist\" + 
0.015*\"center\" + 0.011*\"open\" + 0.010*\"lobe\" + 0.009*\"includ\" + 0.008*\"hot\"\n", + "2019-01-31 00:21:18,851 : INFO : topic #23 (0.020): 0.126*\"audit\" + 0.066*\"best\" + 0.038*\"jacksonvil\" + 0.030*\"yawn\" + 0.026*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.015*\"tokyo\"\n", + "2019-01-31 00:21:18,857 : INFO : topic diff=0.019164, rho=0.076472\n", + "2019-01-31 00:21:19,017 : INFO : PROGRESS: pass 0, at document #344000/4922894\n", + "2019-01-31 00:21:20,510 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:20,776 : INFO : topic #19 (0.020): 0.010*\"origin\" + 0.009*\"woodcut\" + 0.009*\"languag\" + 0.009*\"form\" + 0.009*\"charact\" + 0.008*\"mean\" + 0.008*\"uruguayan\" + 0.007*\"like\" + 0.006*\"god\" + 0.006*\"name\"\n", + "2019-01-31 00:21:20,777 : INFO : topic #13 (0.020): 0.028*\"new\" + 0.027*\"australia\" + 0.024*\"england\" + 0.024*\"sourc\" + 0.023*\"london\" + 0.022*\"australian\" + 0.019*\"ireland\" + 0.018*\"youth\" + 0.018*\"british\" + 0.015*\"wale\"\n", + "2019-01-31 00:21:20,778 : INFO : topic #43 (0.020): 0.076*\"elect\" + 0.056*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.022*\"member\" + 0.019*\"polici\" + 0.016*\"hous\" + 0.015*\"report\" + 0.015*\"tendenc\" + 0.014*\"bypass\"\n", + "2019-01-31 00:21:20,780 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.016*\"king\" + 0.012*\"battalion\" + 0.010*\"aza\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.007*\"centuri\" + 0.007*\"armi\" + 0.007*\"till\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:21:20,781 : INFO : topic #16 (0.020): 0.033*\"priest\" + 0.021*\"grammat\" + 0.020*\"king\" + 0.020*\"quarterli\" + 0.019*\"duke\" + 0.017*\"maria\" + 0.017*\"rotterdam\" + 0.017*\"portugues\" + 0.016*\"count\" + 0.013*\"princ\"\n", + "2019-01-31 00:21:20,786 : INFO : topic diff=0.022057, rho=0.076249\n", + "2019-01-31 
00:21:20,941 : INFO : PROGRESS: pass 0, at document #346000/4922894\n", + "2019-01-31 00:21:22,384 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:22,650 : INFO : topic #33 (0.020): 0.067*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.016*\"wine\" + 0.015*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\"\n", + "2019-01-31 00:21:22,651 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"fleet\" + 0.010*\"coalit\" + 0.008*\"bahá\"\n", + "2019-01-31 00:21:22,652 : INFO : topic #19 (0.020): 0.010*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"charact\" + 0.008*\"uruguayan\" + 0.008*\"mean\" + 0.008*\"like\" + 0.006*\"god\" + 0.006*\"name\"\n", + "2019-01-31 00:21:22,653 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"arsen\" + 0.039*\"line\" + 0.036*\"raid\" + 0.033*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.016*\"pain\" + 0.015*\"word\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:21:22,654 : INFO : topic #41 (0.020): 0.050*\"citi\" + 0.042*\"new\" + 0.025*\"palmer\" + 0.024*\"year\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.010*\"open\" + 0.009*\"lobe\" + 0.009*\"includ\" + 0.008*\"hot\"\n", + "2019-01-31 00:21:22,660 : INFO : topic diff=0.018962, rho=0.076029\n", + "2019-01-31 00:21:22,814 : INFO : PROGRESS: pass 0, at document #348000/4922894\n", + "2019-01-31 00:21:24,264 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:24,530 : INFO : topic #40 (0.020): 0.093*\"unit\" + 0.025*\"collector\" + 0.019*\"schuster\" + 0.019*\"institut\" + 0.016*\"student\" + 0.015*\"requir\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.012*\"degre\"\n", + "2019-01-31 00:21:24,531 : INFO : topic #32 (0.020): 0.060*\"district\" + 0.046*\"vigour\" + 
0.043*\"popolo\" + 0.042*\"tortur\" + 0.029*\"area\" + 0.028*\"cotton\" + 0.027*\"multitud\" + 0.025*\"regim\" + 0.020*\"commun\" + 0.020*\"citi\"\n", + "2019-01-31 00:21:24,533 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.006*\"kill\" + 0.006*\"sack\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"dai\" + 0.004*\"deal\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:21:24,534 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.031*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.022*\"folei\" + 0.016*\"martin\" + 0.016*\"goal\" + 0.012*\"player\"\n", + "2019-01-31 00:21:24,535 : INFO : topic #20 (0.020): 0.128*\"scholar\" + 0.037*\"struggl\" + 0.029*\"high\" + 0.028*\"educ\" + 0.018*\"yawn\" + 0.018*\"collector\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:21:24,541 : INFO : topic diff=0.017567, rho=0.075810\n", + "2019-01-31 00:21:24,751 : INFO : PROGRESS: pass 0, at document #350000/4922894\n", + "2019-01-31 00:21:26,183 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:26,449 : INFO : topic #42 (0.020): 0.039*\"german\" + 0.025*\"germani\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.012*\"israel\" + 0.012*\"der\" + 0.011*\"berlin\" + 0.010*\"jeremiah\" + 0.009*\"greek\" + 0.009*\"itali\"\n", + "2019-01-31 00:21:26,450 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.029*\"offic\" + 0.025*\"minist\" + 0.022*\"seri\" + 0.019*\"gener\" + 0.018*\"chickasaw\" + 0.018*\"member\" + 0.017*\"serv\" + 0.015*\"govern\" + 0.015*\"appeas\"\n", + "2019-01-31 00:21:26,451 : INFO : topic #33 (0.020): 0.068*\"french\" + 0.049*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.015*\"wine\" + 0.015*\"daphn\" + 0.013*\"loui\" + 0.012*\"lazi\" + 0.011*\"piec\"\n", + "2019-01-31 00:21:26,453 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 
0.014*\"mount\" + 0.008*\"north\" + 0.008*\"palmer\" + 0.008*\"land\" + 0.008*\"foam\" + 0.007*\"sourc\"\n", + "2019-01-31 00:21:26,453 : INFO : topic #13 (0.020): 0.028*\"new\" + 0.028*\"australia\" + 0.024*\"australian\" + 0.024*\"england\" + 0.024*\"sourc\" + 0.023*\"london\" + 0.020*\"ireland\" + 0.018*\"british\" + 0.018*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:21:26,459 : INFO : topic diff=0.018178, rho=0.075593\n", + "2019-01-31 00:21:26,613 : INFO : PROGRESS: pass 0, at document #352000/4922894\n", + "2019-01-31 00:21:28,078 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:28,344 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.005*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 00:21:28,345 : INFO : topic #34 (0.020): 0.077*\"start\" + 0.034*\"cotton\" + 0.031*\"unionist\" + 0.024*\"american\" + 0.018*\"new\" + 0.015*\"terri\" + 0.014*\"california\" + 0.013*\"violent\" + 0.012*\"north\" + 0.012*\"warrior\"\n", + "2019-01-31 00:21:28,346 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.031*\"turin\" + 0.031*\"sovereignti\" + 0.028*\"rural\" + 0.026*\"reprint\" + 0.025*\"poison\" + 0.020*\"personifi\" + 0.018*\"moscow\" + 0.016*\"shirin\" + 0.015*\"poland\"\n", + "2019-01-31 00:21:28,348 : INFO : topic #42 (0.020): 0.039*\"german\" + 0.026*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.012*\"der\" + 0.012*\"israel\" + 0.011*\"berlin\" + 0.009*\"jeremiah\" + 0.009*\"greek\" + 0.009*\"european\"\n", + "2019-01-31 00:21:28,349 : INFO : topic #43 (0.020): 0.074*\"elect\" + 0.059*\"parti\" + 0.027*\"democrat\" + 0.024*\"voluntari\" + 0.021*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.015*\"report\" + 0.014*\"hous\" + 0.014*\"bypass\"\n", + "2019-01-31 00:21:28,355 : INFO : topic diff=0.016612, rho=0.075378\n", + "2019-01-31 00:21:28,518 : INFO : PROGRESS: 
pass 0, at document #354000/4922894\n", + "2019-01-31 00:21:30,021 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:30,287 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.053*\"chilton\" + 0.026*\"hong\" + 0.026*\"kong\" + 0.023*\"korea\" + 0.022*\"korean\" + 0.017*\"sourc\" + 0.017*\"leah\" + 0.013*\"kim\" + 0.011*\"taiwan\"\n", + "2019-01-31 00:21:30,288 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.008*\"palmer\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.007*\"vacant\"\n", + "2019-01-31 00:21:30,290 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.024*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"argentina\" + 0.010*\"carlo\"\n", + "2019-01-31 00:21:30,291 : INFO : topic #42 (0.020): 0.041*\"german\" + 0.026*\"germani\" + 0.016*\"jewish\" + 0.014*\"vol\" + 0.013*\"israel\" + 0.012*\"der\" + 0.012*\"berlin\" + 0.010*\"jeremiah\" + 0.008*\"greek\" + 0.008*\"european\"\n", + "2019-01-31 00:21:30,292 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.011*\"start\" + 0.008*\"replac\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"théori\" + 0.006*\"new\" + 0.006*\"summerhil\"\n", + "2019-01-31 00:21:30,297 : INFO : topic diff=0.021235, rho=0.075165\n", + "2019-01-31 00:21:30,457 : INFO : PROGRESS: pass 0, at document #356000/4922894\n", + "2019-01-31 00:21:31,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:32,206 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.017*\"sweden\" + 0.017*\"damag\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.011*\"ton\" + 0.011*\"turkish\" + 0.010*\"turkei\"\n", + "2019-01-31 00:21:32,207 : INFO : topic #17 (0.020): 0.068*\"church\" + 0.018*\"bishop\" + 0.018*\"christian\" + 
0.017*\"cathol\" + 0.017*\"jpg\" + 0.015*\"fifteenth\" + 0.015*\"centuri\" + 0.014*\"retroflex\" + 0.014*\"sail\" + 0.011*\"italian\"\n", + "2019-01-31 00:21:32,208 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.023*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:21:32,210 : INFO : topic #47 (0.020): 0.068*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"damn\" + 0.018*\"compos\" + 0.018*\"theater\" + 0.018*\"place\" + 0.015*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:21:32,211 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"man\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.005*\"night\" + 0.004*\"bewild\" + 0.004*\"vision\" + 0.003*\"introductori\" + 0.003*\"christma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:21:32,217 : INFO : topic diff=0.019679, rho=0.074953\n", + "2019-01-31 00:21:32,371 : INFO : PROGRESS: pass 0, at document #358000/4922894\n", + "2019-01-31 00:21:33,801 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:34,067 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.011*\"georg\" + 0.009*\"rhyme\" + 0.008*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"paul\"\n", + "2019-01-31 00:21:34,068 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.050*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.023*\"korea\" + 0.021*\"korean\" + 0.018*\"leah\" + 0.017*\"sourc\" + 0.015*\"kim\" + 0.011*\"taiwan\"\n", + "2019-01-31 00:21:34,070 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.011*\"fleet\" + 0.010*\"coalit\" + 0.009*\"bahá\"\n", + "2019-01-31 00:21:34,071 : INFO : topic #48 (0.020): 
0.083*\"march\" + 0.080*\"januari\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.075*\"juli\" + 0.075*\"judici\" + 0.074*\"april\" + 0.073*\"notion\" + 0.073*\"august\" + 0.066*\"decatur\"\n", + "2019-01-31 00:21:34,072 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.021*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:21:34,079 : INFO : topic diff=0.017307, rho=0.074744\n", + "2019-01-31 00:21:36,800 : INFO : -12.078 per-word bound, 4322.4 perplexity estimate based on a held-out corpus of 2000 documents with 543113 words\n", + "2019-01-31 00:21:36,800 : INFO : PROGRESS: pass 0, at document #360000/4922894\n", + "2019-01-31 00:21:38,236 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:38,503 : INFO : topic #47 (0.020): 0.069*\"muscl\" + 0.034*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.018*\"damn\" + 0.017*\"place\" + 0.015*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:21:38,504 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"caus\" + 0.006*\"cancer\" + 0.006*\"che\" + 0.006*\"treat\"\n", + "2019-01-31 00:21:38,506 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.027*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.011*\"vocabulari\"\n", + "2019-01-31 00:21:38,507 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.042*\"arsen\" + 0.041*\"line\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.016*\"pain\" + 0.016*\"artist\" + 0.015*\"word\"\n", + "2019-01-31 00:21:38,508 : INFO : topic #43 (0.020): 0.073*\"elect\" + 0.057*\"parti\" + 0.027*\"democrat\" + 0.025*\"voluntari\" + 0.021*\"member\" + 
0.018*\"polici\" + 0.018*\"republ\" + 0.015*\"report\" + 0.014*\"bypass\" + 0.014*\"hous\"\n", + "2019-01-31 00:21:38,514 : INFO : topic diff=0.017960, rho=0.074536\n", + "2019-01-31 00:21:38,670 : INFO : PROGRESS: pass 0, at document #362000/4922894\n", + "2019-01-31 00:21:40,126 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:40,392 : INFO : topic #42 (0.020): 0.040*\"german\" + 0.026*\"germani\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.013*\"vol\" + 0.012*\"der\" + 0.012*\"berlin\" + 0.011*\"jeremiah\" + 0.009*\"nazi\" + 0.008*\"itali\"\n", + "2019-01-31 00:21:40,393 : INFO : topic #45 (0.020): 0.020*\"black\" + 0.018*\"colder\" + 0.017*\"western\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.009*\"illicit\" + 0.008*\"green\" + 0.006*\"hand\" + 0.006*\"fit\"\n", + "2019-01-31 00:21:40,394 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.029*\"offic\" + 0.025*\"minist\" + 0.023*\"seri\" + 0.020*\"gener\" + 0.018*\"member\" + 0.017*\"chickasaw\" + 0.016*\"serv\" + 0.016*\"appeas\" + 0.015*\"govern\"\n", + "2019-01-31 00:21:40,395 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.015*\"daphn\" + 0.014*\"wine\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.010*\"piec\"\n", + "2019-01-31 00:21:40,396 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.033*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"crete\" + 0.023*\"folei\" + 0.023*\"scientist\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:21:40,402 : INFO : topic diff=0.015836, rho=0.074329\n", + "2019-01-31 00:21:40,557 : INFO : PROGRESS: pass 0, at document #364000/4922894\n", + "2019-01-31 00:21:42,004 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:42,270 : INFO : topic #20 (0.020): 0.129*\"scholar\" + 0.037*\"struggl\" + 0.030*\"high\" + 0.028*\"educ\" + 0.019*\"collector\" + 
0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.008*\"gothic\"\n", + "2019-01-31 00:21:42,272 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"septemb\" + 0.021*\"epiru\" + 0.018*\"teacher\" + 0.018*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:21:42,273 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"man\" + 0.005*\"litig\" + 0.005*\"blue\" + 0.005*\"night\" + 0.004*\"bewild\" + 0.004*\"vision\" + 0.003*\"introductori\" + 0.003*\"york\"\n", + "2019-01-31 00:21:42,274 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.033*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"crete\" + 0.023*\"folei\" + 0.022*\"scientist\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:21:42,276 : INFO : topic #39 (0.020): 0.028*\"canada\" + 0.025*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"canadian\" + 0.018*\"clot\" + 0.016*\"basketbal\" + 0.015*\"hoar\" + 0.014*\"toronto\" + 0.013*\"confer\" + 0.012*\"ontario\"\n", + "2019-01-31 00:21:42,281 : INFO : topic diff=0.015960, rho=0.074125\n", + "2019-01-31 00:21:42,436 : INFO : PROGRESS: pass 0, at document #366000/4922894\n", + "2019-01-31 00:21:43,895 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:44,161 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.037*\"sovereignti\" + 0.030*\"rural\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.023*\"turin\" + 0.020*\"personifi\" + 0.018*\"moscow\" + 0.015*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:21:44,162 : INFO : topic #39 (0.020): 0.028*\"canada\" + 0.025*\"canadian\" + 0.024*\"scientist\" + 0.024*\"taxpay\" + 0.019*\"clot\" + 0.016*\"basketbal\" + 0.015*\"hoar\" + 0.014*\"toronto\" + 0.013*\"confer\" + 0.012*\"ontario\"\n", + "2019-01-31 00:21:44,163 : INFO : topic #36 (0.020): 0.024*\"companhia\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"network\" + 
0.008*\"prognosi\" + 0.008*\"base\" + 0.008*\"manag\" + 0.008*\"includ\" + 0.007*\"oper\" + 0.007*\"user\"\n", + "2019-01-31 00:21:44,164 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.016*\"buford\" + 0.012*\"briarwood\" + 0.012*\"rosenwald\" + 0.011*\"histor\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.009*\"lobe\"\n", + "2019-01-31 00:21:44,166 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.015*\"islam\" + 0.014*\"televis\" + 0.011*\"pakistan\" + 0.010*\"start\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.008*\"alam\"\n", + "2019-01-31 00:21:44,171 : INFO : topic diff=0.016409, rho=0.073922\n", + "2019-01-31 00:21:44,327 : INFO : PROGRESS: pass 0, at document #368000/4922894\n", + "2019-01-31 00:21:45,791 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:46,057 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.020*\"taxpay\" + 0.018*\"candid\" + 0.016*\"tornado\" + 0.014*\"driver\" + 0.013*\"find\" + 0.013*\"ret\" + 0.010*\"fool\" + 0.010*\"scientist\" + 0.010*\"champion\"\n", + "2019-01-31 00:21:46,058 : INFO : topic #41 (0.020): 0.050*\"citi\" + 0.041*\"new\" + 0.025*\"palmer\" + 0.025*\"year\" + 0.014*\"strategist\" + 0.014*\"center\" + 0.011*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:21:46,060 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.006*\"sack\" + 0.005*\"man\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"wander\"\n", + "2019-01-31 00:21:46,061 : INFO : topic #4 (0.020): 0.026*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"produc\" + 0.009*\"elabor\" + 0.009*\"veget\" + 0.009*\"candid\" + 0.008*\"encyclopedia\" + 0.007*\"stanc\"\n", + "2019-01-31 00:21:46,062 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"man\" + 0.005*\"litig\" + 0.005*\"blue\" + 
0.005*\"night\" + 0.004*\"bewild\" + 0.003*\"vision\" + 0.003*\"york\" + 0.003*\"epiru\"\n", + "2019-01-31 00:21:46,068 : INFO : topic diff=0.017176, rho=0.073721\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:21:46,219 : INFO : PROGRESS: pass 0, at document #370000/4922894\n", + "2019-01-31 00:21:47,643 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:47,909 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.006*\"sack\" + 0.005*\"man\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:21:47,911 : INFO : topic #36 (0.020): 0.025*\"companhia\" + 0.009*\"network\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"prognosi\" + 0.008*\"base\" + 0.008*\"manag\" + 0.008*\"oper\" + 0.008*\"includ\" + 0.007*\"market\"\n", + "2019-01-31 00:21:47,912 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.005*\"théori\" + 0.005*\"method\" + 0.005*\"utopian\"\n", + "2019-01-31 00:21:47,913 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"man\" + 0.005*\"litig\" + 0.005*\"blue\" + 0.005*\"night\" + 0.004*\"bewild\" + 0.003*\"vision\" + 0.003*\"jolli\" + 0.003*\"york\"\n", + "2019-01-31 00:21:47,914 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.011*\"nativist\" + 0.011*\"fleet\" + 0.011*\"coalit\" + 0.010*\"blur\" + 0.009*\"bahá\"\n", + "2019-01-31 00:21:47,920 : INFO : topic diff=0.015674, rho=0.073521\n", + "2019-01-31 00:21:48,076 : INFO : PROGRESS: pass 0, at document #372000/4922894\n", + "2019-01-31 00:21:49,525 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:49,791 : INFO : topic #18 (0.020): 0.008*\"théori\" + 
0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.005*\"man\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:21:49,792 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.021*\"wife\" + 0.019*\"tourist\" + 0.017*\"martin\" + 0.015*\"champion\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"taxpay\" + 0.012*\"winner\"\n", + "2019-01-31 00:21:49,794 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.037*\"sovereignti\" + 0.031*\"rural\" + 0.023*\"reprint\" + 0.022*\"poison\" + 0.020*\"turin\" + 0.020*\"moscow\" + 0.020*\"personifi\" + 0.015*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:21:49,795 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"area\" + 0.014*\"mount\" + 0.008*\"palmer\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:21:49,796 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.056*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.030*\"area\" + 0.027*\"regim\" + 0.026*\"cotton\" + 0.025*\"multitud\" + 0.021*\"commun\" + 0.020*\"citi\"\n", + "2019-01-31 00:21:49,802 : INFO : topic diff=0.018160, rho=0.073324\n", + "2019-01-31 00:21:49,958 : INFO : PROGRESS: pass 0, at document #374000/4922894\n", + "2019-01-31 00:21:51,396 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:51,662 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.024*\"american\" + 0.018*\"new\" + 0.014*\"terri\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.013*\"north\" + 0.012*\"violent\"\n", + "2019-01-31 00:21:51,664 : INFO : topic #36 (0.020): 0.025*\"companhia\" + 0.009*\"network\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"prognosi\" + 0.008*\"base\" + 0.008*\"manag\" + 0.008*\"oper\" + 0.008*\"includ\" + 0.007*\"market\"\n", + "2019-01-31 00:21:51,665 : INFO : topic #9 (0.020): 0.066*\"bone\" + 
0.047*\"american\" + 0.026*\"valour\" + 0.019*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.017*\"folei\" + 0.015*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:21:51,666 : INFO : topic #29 (0.020): 0.012*\"govern\" + 0.011*\"start\" + 0.008*\"countri\" + 0.008*\"replac\" + 0.008*\"yawn\" + 0.007*\"million\" + 0.007*\"nation\" + 0.006*\"théori\" + 0.006*\"new\" + 0.006*\"summerhil\"\n", + "2019-01-31 00:21:51,667 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.024*\"minist\" + 0.022*\"seri\" + 0.022*\"serv\" + 0.019*\"gener\" + 0.018*\"member\" + 0.016*\"chickasaw\" + 0.015*\"appeas\" + 0.014*\"govern\"\n", + "2019-01-31 00:21:51,673 : INFO : topic diff=0.016402, rho=0.073127\n", + "2019-01-31 00:21:51,828 : INFO : PROGRESS: pass 0, at document #376000/4922894\n", + "2019-01-31 00:21:53,285 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:53,551 : INFO : topic #19 (0.020): 0.011*\"languag\" + 0.010*\"origin\" + 0.009*\"woodcut\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"charact\" + 0.008*\"uruguayan\" + 0.008*\"god\" + 0.007*\"like\" + 0.006*\"differ\"\n", + "2019-01-31 00:21:53,553 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.043*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.020*\"korean\" + 0.019*\"leah\" + 0.018*\"kim\" + 0.015*\"sourc\" + 0.011*\"wang\"\n", + "2019-01-31 00:21:53,554 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.024*\"american\" + 0.018*\"new\" + 0.014*\"terri\" + 0.014*\"california\" + 0.013*\"violent\" + 0.013*\"warrior\" + 0.013*\"north\"\n", + "2019-01-31 00:21:53,555 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.014*\"king\" + 0.012*\"aza\" + 0.011*\"teufel\" + 0.010*\"battalion\" + 0.010*\"empath\" + 0.010*\"till\" + 0.008*\"forc\" + 0.008*\"centuri\" + 0.007*\"armi\"\n", + "2019-01-31 00:21:53,557 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 
0.021*\"wife\" + 0.019*\"tourist\" + 0.016*\"martin\" + 0.015*\"champion\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"chamber\" + 0.012*\"winner\"\n", + "2019-01-31 00:21:53,562 : INFO : topic diff=0.014290, rho=0.072932\n", + "2019-01-31 00:21:53,716 : INFO : PROGRESS: pass 0, at document #378000/4922894\n", + "2019-01-31 00:21:55,148 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:55,414 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.013*\"king\" + 0.012*\"aza\" + 0.011*\"teufel\" + 0.010*\"battalion\" + 0.010*\"empath\" + 0.009*\"till\" + 0.008*\"forc\" + 0.008*\"centuri\" + 0.007*\"armi\"\n", + "2019-01-31 00:21:55,415 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.005*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:21:55,416 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"acid\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:21:55,417 : INFO : topic #17 (0.020): 0.067*\"church\" + 0.018*\"bishop\" + 0.017*\"christian\" + 0.017*\"cathol\" + 0.017*\"jpg\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.014*\"fifteenth\" + 0.014*\"centuri\" + 0.011*\"italian\"\n", + "2019-01-31 00:21:55,418 : INFO : topic #36 (0.020): 0.025*\"companhia\" + 0.009*\"network\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"prognosi\" + 0.008*\"base\" + 0.008*\"oper\" + 0.008*\"manag\" + 0.008*\"includ\" + 0.007*\"busi\"\n", + "2019-01-31 00:21:55,424 : INFO : topic diff=0.014800, rho=0.072739\n", + "2019-01-31 00:21:58,215 : INFO : -11.609 per-word bound, 3122.8 perplexity estimate based on a held-out corpus of 2000 documents with 582384 words\n", + "2019-01-31 00:21:58,215 : INFO : PROGRESS: pass 0, at document #380000/4922894\n", + "2019-01-31 00:21:59,678 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:21:59,944 : INFO : topic #4 (0.020): 0.026*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.009*\"produc\" + 0.009*\"candid\" + 0.009*\"veget\" + 0.008*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:21:59,945 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.023*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.011*\"briarwood\" + 0.011*\"histor\" + 0.011*\"constitut\" + 0.011*\"rosenwald\" + 0.010*\"strategist\" + 0.009*\"lobe\"\n", + "2019-01-31 00:21:59,947 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.024*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"josé\" + 0.010*\"santa\"\n", + "2019-01-31 00:21:59,948 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.011*\"airbu\" + 0.010*\"airmen\"\n", + "2019-01-31 00:21:59,948 : INFO : topic #40 (0.020): 0.099*\"unit\" + 0.025*\"collector\" + 0.020*\"institut\" + 0.019*\"schuster\" + 0.016*\"student\" + 0.015*\"professor\" + 0.015*\"requir\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:21:59,954 : INFO : topic diff=0.016913, rho=0.072548\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:22:00,162 : INFO : PROGRESS: pass 0, at document #382000/4922894\n", + "2019-01-31 00:22:01,601 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:01,866 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.033*\"sovereignti\" + 0.028*\"rural\" + 0.025*\"poison\" + 0.022*\"reprint\" + 0.021*\"personifi\" + 0.018*\"moscow\" + 0.017*\"turin\" + 0.017*\"poland\" + 0.015*\"shirin\"\n", + "2019-01-31 00:22:01,868 : INFO : topic #33 (0.020): 0.064*\"french\" + 
0.044*\"franc\" + 0.029*\"pari\" + 0.021*\"jean\" + 0.021*\"sail\" + 0.015*\"daphn\" + 0.013*\"loui\" + 0.012*\"lazi\" + 0.012*\"wine\" + 0.011*\"piec\"\n", + "2019-01-31 00:22:01,869 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.020*\"taxpay\" + 0.017*\"ret\" + 0.017*\"candid\" + 0.014*\"driver\" + 0.014*\"tornado\" + 0.012*\"find\" + 0.010*\"horac\" + 0.010*\"scientist\" + 0.010*\"fool\"\n", + "2019-01-31 00:22:01,870 : INFO : topic #29 (0.020): 0.011*\"govern\" + 0.011*\"start\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.008*\"replac\" + 0.008*\"million\" + 0.007*\"nation\" + 0.006*\"théori\" + 0.006*\"new\" + 0.006*\"function\"\n", + "2019-01-31 00:22:01,872 : INFO : topic #43 (0.020): 0.070*\"elect\" + 0.058*\"parti\" + 0.025*\"democrat\" + 0.025*\"voluntari\" + 0.021*\"member\" + 0.019*\"polici\" + 0.015*\"republ\" + 0.015*\"selma\" + 0.015*\"bypass\" + 0.015*\"seaport\"\n", + "2019-01-31 00:22:01,877 : INFO : topic diff=0.015176, rho=0.072357\n", + "2019-01-31 00:22:02,029 : INFO : PROGRESS: pass 0, at document #384000/4922894\n", + "2019-01-31 00:22:03,465 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:03,731 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.028*\"factor\" + 0.024*\"adulthood\" + 0.016*\"hostil\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"live\" + 0.011*\"plaisir\" + 0.010*\"yawn\" + 0.009*\"genu\"\n", + "2019-01-31 00:22:03,733 : INFO : topic #39 (0.020): 0.028*\"canada\" + 0.024*\"canadian\" + 0.023*\"scientist\" + 0.023*\"taxpay\" + 0.017*\"clot\" + 0.017*\"basketbal\" + 0.015*\"hoar\" + 0.014*\"toronto\" + 0.012*\"ontario\" + 0.012*\"confer\"\n", + "2019-01-31 00:22:03,734 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.014*\"pope\" + 0.013*\"scot\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"fleet\" + 0.010*\"coalit\" + 0.009*\"class\"\n", + "2019-01-31 00:22:03,735 : INFO : topic #45 (0.020): 0.020*\"black\" + 0.017*\"colder\" + 
0.017*\"western\" + 0.014*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.009*\"illicit\" + 0.008*\"green\" + 0.006*\"fit\" + 0.006*\"arm\"\n", + "2019-01-31 00:22:03,736 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.005*\"method\" + 0.005*\"differ\" + 0.005*\"poet\"\n", + "2019-01-31 00:22:03,742 : INFO : topic diff=0.015016, rho=0.072169\n", + "2019-01-31 00:22:03,896 : INFO : PROGRESS: pass 0, at document #386000/4922894\n", + "2019-01-31 00:22:05,338 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:05,605 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.011*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\" + 0.008*\"mexican–american\"\n", + "2019-01-31 00:22:05,606 : INFO : topic #39 (0.020): 0.029*\"canada\" + 0.025*\"canadian\" + 0.023*\"scientist\" + 0.022*\"taxpay\" + 0.017*\"clot\" + 0.016*\"basketbal\" + 0.015*\"hoar\" + 0.014*\"toronto\" + 0.013*\"ontario\" + 0.012*\"confer\"\n", + "2019-01-31 00:22:05,607 : INFO : topic #16 (0.020): 0.032*\"priest\" + 0.021*\"king\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.017*\"maria\" + 0.016*\"duke\" + 0.015*\"idiosyncrat\" + 0.015*\"rotterdam\" + 0.014*\"count\" + 0.014*\"princ\"\n", + "2019-01-31 00:22:05,608 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"crete\" + 0.023*\"scientist\" + 0.023*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:22:05,609 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.005*\"differ\" + 0.005*\"method\"\n", + "2019-01-31 00:22:05,615 : INFO : topic diff=0.014705, rho=0.071982\n", + "2019-01-31 
00:22:05,769 : INFO : PROGRESS: pass 0, at document #388000/4922894\n", + "2019-01-31 00:22:07,209 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:07,475 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.023*\"player\" + 0.021*\"scientist\" + 0.020*\"place\" + 0.017*\"taxpay\" + 0.012*\"folei\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.010*\"yard\" + 0.009*\"barber\"\n", + "2019-01-31 00:22:07,476 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"man\" + 0.005*\"litig\" + 0.005*\"blue\" + 0.005*\"night\" + 0.004*\"bewild\" + 0.003*\"vision\" + 0.003*\"epiru\" + 0.003*\"york\"\n", + "2019-01-31 00:22:07,477 : INFO : topic #47 (0.020): 0.072*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"jack\" + 0.012*\"physician\"\n", + "2019-01-31 00:22:07,478 : INFO : topic #17 (0.020): 0.065*\"church\" + 0.019*\"sail\" + 0.017*\"cathol\" + 0.017*\"bishop\" + 0.016*\"christian\" + 0.016*\"jpg\" + 0.014*\"fifteenth\" + 0.014*\"retroflex\" + 0.013*\"centuri\" + 0.011*\"italian\"\n", + "2019-01-31 00:22:07,479 : INFO : topic #40 (0.020): 0.097*\"unit\" + 0.025*\"collector\" + 0.020*\"institut\" + 0.020*\"schuster\" + 0.016*\"student\" + 0.015*\"requir\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:22:07,485 : INFO : topic diff=0.016741, rho=0.071796\n", + "2019-01-31 00:22:07,641 : INFO : PROGRESS: pass 0, at document #390000/4922894\n", + "2019-01-31 00:22:09,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:09,354 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.053*\"vigour\" + 0.042*\"popolo\" + 0.042*\"tortur\" + 0.029*\"cotton\" + 0.029*\"regim\" + 0.029*\"area\" + 0.024*\"multitud\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:22:09,355 : INFO : topic #3 (0.020): 
0.039*\"present\" + 0.027*\"offic\" + 0.025*\"minist\" + 0.021*\"seri\" + 0.021*\"serv\" + 0.019*\"member\" + 0.019*\"gener\" + 0.016*\"chickasaw\" + 0.015*\"govern\" + 0.014*\"appeas\"\n", + "2019-01-31 00:22:09,356 : INFO : topic #2 (0.020): 0.043*\"shield\" + 0.043*\"isl\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"renaiss\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.011*\"walter\" + 0.010*\"buford\"\n", + "2019-01-31 00:22:09,358 : INFO : topic #45 (0.020): 0.021*\"black\" + 0.017*\"colder\" + 0.017*\"western\" + 0.014*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.008*\"illicit\" + 0.008*\"green\" + 0.007*\"fit\" + 0.006*\"color\"\n", + "2019-01-31 00:22:09,359 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"have\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:22:09,365 : INFO : topic diff=0.017004, rho=0.071611\n", + "2019-01-31 00:22:09,526 : INFO : PROGRESS: pass 0, at document #392000/4922894\n", + "2019-01-31 00:22:10,993 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:11,259 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.034*\"sovereignti\" + 0.030*\"rural\" + 0.025*\"poison\" + 0.022*\"reprint\" + 0.021*\"personifi\" + 0.018*\"poland\" + 0.017*\"moscow\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 00:22:11,260 : INFO : topic #40 (0.020): 0.097*\"unit\" + 0.025*\"collector\" + 0.021*\"institut\" + 0.020*\"schuster\" + 0.016*\"student\" + 0.016*\"requir\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:22:11,261 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.023*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"rosenwald\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.009*\"linear\"\n", + "2019-01-31 00:22:11,262 : INFO : topic #45 
(0.020): 0.020*\"black\" + 0.017*\"western\" + 0.017*\"colder\" + 0.014*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.008*\"illicit\" + 0.008*\"green\" + 0.007*\"fit\" + 0.006*\"color\"\n", + "2019-01-31 00:22:11,263 : INFO : topic #36 (0.020): 0.025*\"companhia\" + 0.009*\"network\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"manag\" + 0.008*\"prognosi\" + 0.008*\"base\" + 0.008*\"oper\" + 0.008*\"includ\" + 0.008*\"market\"\n", + "2019-01-31 00:22:11,269 : INFO : topic diff=0.018016, rho=0.071429\n", + "2019-01-31 00:22:11,425 : INFO : PROGRESS: pass 0, at document #394000/4922894\n", + "2019-01-31 00:22:12,856 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:22:13,122 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.024*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"rosenwald\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.009*\"linear\"\n", + "2019-01-31 00:22:13,124 : INFO : topic #45 (0.020): 0.021*\"black\" + 0.017*\"western\" + 0.016*\"colder\" + 0.014*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.008*\"illicit\" + 0.008*\"green\" + 0.007*\"fit\" + 0.006*\"color\"\n", + "2019-01-31 00:22:13,125 : INFO : topic #42 (0.020): 0.040*\"german\" + 0.026*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.012*\"berlin\" + 0.011*\"der\" + 0.009*\"jeremiah\" + 0.009*\"europ\" + 0.008*\"european\"\n", + "2019-01-31 00:22:13,126 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"hormon\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:22:13,127 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.006*\"sack\" + 0.005*\"man\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"fraud\"\n", 
+ "2019-01-31 00:22:13,133 : INFO : topic diff=0.014678, rho=0.071247\n", + "2019-01-31 00:22:13,293 : INFO : PROGRESS: pass 0, at document #396000/4922894\n", + "2019-01-31 00:22:14,766 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:15,032 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.011*\"polaris\" + 0.010*\"legal\" + 0.007*\"justic\" + 0.007*\"judaism\"\n", + "2019-01-31 00:22:15,033 : INFO : topic #17 (0.020): 0.064*\"church\" + 0.018*\"sail\" + 0.018*\"cathol\" + 0.017*\"christian\" + 0.017*\"bishop\" + 0.015*\"jpg\" + 0.014*\"centuri\" + 0.013*\"retroflex\" + 0.013*\"fifteenth\" + 0.010*\"italian\"\n", + "2019-01-31 00:22:15,034 : INFO : topic #46 (0.020): 0.020*\"wind\" + 0.018*\"stop\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.016*\"norwegian\" + 0.016*\"sweden\" + 0.015*\"damag\" + 0.012*\"treeless\" + 0.012*\"turkish\" + 0.011*\"iceland\"\n", + "2019-01-31 00:22:15,035 : INFO : topic #29 (0.020): 0.011*\"govern\" + 0.011*\"start\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.008*\"million\" + 0.007*\"replac\" + 0.007*\"nation\" + 0.006*\"function\" + 0.006*\"théori\" + 0.006*\"new\"\n", + "2019-01-31 00:22:15,037 : INFO : topic #26 (0.020): 0.033*\"woman\" + 0.032*\"workplac\" + 0.030*\"champion\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.022*\"event\" + 0.020*\"medal\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"alic\"\n", + "2019-01-31 00:22:15,042 : INFO : topic diff=0.016258, rho=0.071067\n", + "2019-01-31 00:22:15,197 : INFO : PROGRESS: pass 0, at document #398000/4922894\n", + "2019-01-31 00:22:16,641 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:16,907 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 
0.010*\"acrimoni\"\n", + "2019-01-31 00:22:16,908 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.029*\"incumb\" + 0.013*\"televis\" + 0.013*\"pakistan\" + 0.011*\"islam\" + 0.011*\"muskoge\" + 0.010*\"start\" + 0.009*\"alam\" + 0.009*\"sri\" + 0.009*\"tajikistan\"\n", + "2019-01-31 00:22:16,910 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"walter\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.016*\"com\" + 0.015*\"oper\" + 0.014*\"militari\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:22:16,911 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.012*\"bone\" + 0.012*\"john\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:22:16,912 : INFO : topic #20 (0.020): 0.132*\"scholar\" + 0.039*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.019*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.009*\"class\"\n", + "2019-01-31 00:22:16,918 : INFO : topic diff=0.017548, rho=0.070888\n", + "2019-01-31 00:22:19,603 : INFO : -11.685 per-word bound, 3292.1 perplexity estimate based on a held-out corpus of 2000 documents with 516897 words\n", + "2019-01-31 00:22:19,604 : INFO : PROGRESS: pass 0, at document #400000/4922894\n", + "2019-01-31 00:22:21,026 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:21,292 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.068*\"best\" + 0.030*\"jacksonvil\" + 0.030*\"yawn\" + 0.025*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.012*\"prison\"\n", + "2019-01-31 00:22:21,293 : INFO : topic #4 (0.020): 0.025*\"enfranchis\" + 0.017*\"elabor\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"produc\" + 0.010*\"mode\" + 0.009*\"candid\" + 0.008*\"veget\" + 0.008*\"encyclopedia\" + 0.007*\"spectacl\"\n", + "2019-01-31 00:22:21,295 : INFO : topic #15 (0.020): 0.014*\"small\" + 
0.013*\"develop\" + 0.010*\"organ\" + 0.010*\"requir\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"student\" + 0.008*\"human\" + 0.008*\"socialist\"\n", + "2019-01-31 00:22:21,296 : INFO : topic #2 (0.020): 0.043*\"shield\" + 0.041*\"isl\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"fleet\" + 0.010*\"blur\" + 0.010*\"nativist\" + 0.010*\"walter\" + 0.010*\"coalit\"\n", + "2019-01-31 00:22:21,297 : INFO : topic #0 (0.020): 0.075*\"statewid\" + 0.046*\"arsen\" + 0.038*\"line\" + 0.031*\"museo\" + 0.030*\"raid\" + 0.018*\"traceabl\" + 0.018*\"pain\" + 0.017*\"serv\" + 0.016*\"word\" + 0.015*\"artist\"\n", + "2019-01-31 00:22:21,302 : INFO : topic diff=0.016718, rho=0.070711\n", + "2019-01-31 00:22:21,458 : INFO : PROGRESS: pass 0, at document #402000/4922894\n", + "2019-01-31 00:22:22,910 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:23,177 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.030*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"televis\" + 0.011*\"islam\" + 0.010*\"alam\" + 0.010*\"start\" + 0.010*\"sri\" + 0.010*\"muskoge\" + 0.009*\"tajikistan\"\n", + "2019-01-31 00:22:23,178 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.069*\"best\" + 0.031*\"jacksonvil\" + 0.030*\"yawn\" + 0.025*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.012*\"prison\"\n", + "2019-01-31 00:22:23,179 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.021*\"word\" + 0.017*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:22:23,181 : INFO : topic #20 (0.020): 0.131*\"scholar\" + 0.039*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.020*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:22:23,182 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 
0.021*\"del\" + 0.015*\"mexico\" + 0.014*\"soviet\" + 0.013*\"francisco\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"josé\" + 0.011*\"carlo\"\n", + "2019-01-31 00:22:23,188 : INFO : topic diff=0.013449, rho=0.070535\n", + "2019-01-31 00:22:23,342 : INFO : PROGRESS: pass 0, at document #404000/4922894\n", + "2019-01-31 00:22:24,794 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:25,060 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.033*\"cleveland\" + 0.030*\"place\" + 0.029*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:22:25,061 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.033*\"unionist\" + 0.033*\"cotton\" + 0.024*\"american\" + 0.019*\"new\" + 0.014*\"california\" + 0.014*\"terri\" + 0.014*\"north\" + 0.012*\"violent\" + 0.012*\"warrior\"\n", + "2019-01-31 00:22:25,062 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.011*\"landslid\" + 0.010*\"champion\" + 0.010*\"théori\"\n", + "2019-01-31 00:22:25,064 : INFO : topic #36 (0.020): 0.025*\"companhia\" + 0.009*\"network\" + 0.009*\"serv\" + 0.009*\"manag\" + 0.009*\"develop\" + 0.008*\"includ\" + 0.008*\"prognosi\" + 0.008*\"oper\" + 0.008*\"base\" + 0.007*\"busi\"\n", + "2019-01-31 00:22:25,065 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.025*\"adulthood\" + 0.017*\"hostil\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"live\" + 0.010*\"genu\" + 0.010*\"plaisir\" + 0.010*\"yawn\"\n", + "2019-01-31 00:22:25,071 : INFO : topic diff=0.014262, rho=0.070360\n", + "2019-01-31 00:22:25,238 : INFO : PROGRESS: pass 0, at document #406000/4922894\n", + "2019-01-31 00:22:26,713 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:26,979 : INFO : topic #11 (0.020): 0.028*\"john\" + 
0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.011*\"georg\" + 0.009*\"paul\" + 0.009*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"rhyme\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:22:26,980 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.027*\"canadian\" + 0.025*\"taxpay\" + 0.021*\"scientist\" + 0.017*\"clot\" + 0.016*\"basketbal\" + 0.015*\"hoar\" + 0.014*\"ontario\" + 0.014*\"toronto\" + 0.011*\"confer\"\n", + "2019-01-31 00:22:26,982 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.033*\"unionist\" + 0.032*\"cotton\" + 0.024*\"american\" + 0.019*\"new\" + 0.014*\"terri\" + 0.014*\"california\" + 0.014*\"north\" + 0.012*\"violent\" + 0.012*\"warrior\"\n", + "2019-01-31 00:22:26,983 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.019*\"damag\" + 0.017*\"wind\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"treeless\" + 0.012*\"turkish\" + 0.011*\"farid\"\n", + "2019-01-31 00:22:26,984 : INFO : topic #42 (0.020): 0.042*\"german\" + 0.029*\"germani\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.014*\"israel\" + 0.011*\"der\" + 0.011*\"berlin\" + 0.009*\"jeremiah\" + 0.008*\"europ\" + 0.008*\"itali\"\n", + "2019-01-31 00:22:26,990 : INFO : topic diff=0.017943, rho=0.070186\n", + "2019-01-31 00:22:27,146 : INFO : PROGRESS: pass 0, at document #408000/4922894\n", + "2019-01-31 00:22:28,597 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:28,863 : INFO : topic #15 (0.020): 0.014*\"develop\" + 0.013*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"requir\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.008*\"student\" + 0.008*\"human\" + 0.007*\"socialist\"\n", + "2019-01-31 00:22:28,865 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.011*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\" + 0.008*\"mexican–american\"\n", + 
"2019-01-31 00:22:28,866 : INFO : topic #16 (0.020): 0.032*\"priest\" + 0.023*\"king\" + 0.020*\"quarterli\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"portugues\" + 0.017*\"grammat\" + 0.016*\"maria\" + 0.015*\"brazil\" + 0.014*\"rotterdam\"\n", + "2019-01-31 00:22:28,867 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.033*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:22:28,868 : INFO : topic #3 (0.020): 0.045*\"present\" + 0.032*\"minist\" + 0.029*\"offic\" + 0.020*\"seri\" + 0.019*\"member\" + 0.019*\"gener\" + 0.018*\"serv\" + 0.016*\"prime\" + 0.016*\"chickasaw\" + 0.015*\"govern\"\n", + "2019-01-31 00:22:28,874 : INFO : topic diff=0.015836, rho=0.070014\n", + "2019-01-31 00:22:29,027 : INFO : PROGRESS: pass 0, at document #410000/4922894\n", + "2019-01-31 00:22:30,468 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:30,734 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"servitud\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.005*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:22:30,736 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.006*\"sack\" + 0.005*\"man\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:22:30,737 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.022*\"player\" + 0.021*\"scientist\" + 0.021*\"place\" + 0.019*\"taxpay\" + 0.012*\"yard\" + 0.011*\"folei\" + 0.011*\"leagu\" + 0.010*\"ruler\" + 0.008*\"barber\"\n", + "2019-01-31 00:22:30,738 : INFO : topic #7 (0.020): 0.020*\"di\" + 0.020*\"snatch\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"john\" + 0.012*\"bone\" + 0.012*\"life\" + 0.011*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 
00:22:30,740 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.014*\"king\" + 0.011*\"aza\" + 0.010*\"teufel\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.008*\"till\" + 0.008*\"centuri\" + 0.008*\"armi\"\n", + "2019-01-31 00:22:30,745 : INFO : topic diff=0.015655, rho=0.069843\n", + "2019-01-31 00:22:30,902 : INFO : PROGRESS: pass 0, at document #412000/4922894\n", + "2019-01-31 00:22:32,348 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:32,614 : INFO : topic #13 (0.020): 0.029*\"australia\" + 0.028*\"new\" + 0.025*\"sourc\" + 0.024*\"australian\" + 0.023*\"england\" + 0.023*\"london\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.017*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:22:32,615 : INFO : topic #8 (0.020): 0.031*\"law\" + 0.023*\"cortic\" + 0.022*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.010*\"legal\" + 0.007*\"rudolf\" + 0.007*\"judaism\"\n", + "2019-01-31 00:22:32,616 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.021*\"word\" + 0.017*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:22:32,618 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.033*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:22:32,619 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.020*\"taxpay\" + 0.017*\"candid\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.010*\"landslid\" + 0.010*\"champion\" + 0.010*\"fool\"\n", + "2019-01-31 00:22:32,625 : INFO : topic diff=0.014874, rho=0.069673\n", + "2019-01-31 00:22:32,793 : INFO : PROGRESS: pass 0, at document #414000/4922894\n", + "2019-01-31 00:22:34,248 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:22:34,514 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.011*\"georg\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"mexican–american\" + 0.008*\"paul\"\n", + "2019-01-31 00:22:34,516 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"john\" + 0.012*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:22:34,517 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.023*\"tourist\" + 0.017*\"martin\" + 0.016*\"champion\" + 0.015*\"winner\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"chamber\"\n", + "2019-01-31 00:22:34,518 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.015*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:22:34,520 : INFO : topic #19 (0.020): 0.011*\"languag\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.007*\"mean\" + 0.007*\"like\" + 0.007*\"anim\" + 0.006*\"god\"\n", + "2019-01-31 00:22:34,525 : INFO : topic diff=0.015824, rho=0.069505\n", + "2019-01-31 00:22:34,738 : INFO : PROGRESS: pass 0, at document #416000/4922894\n", + "2019-01-31 00:22:36,201 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:36,467 : INFO : topic #30 (0.020): 0.034*\"leagu\" + 0.034*\"cleveland\" + 0.030*\"place\" + 0.029*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:22:36,468 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.015*\"elabor\" + 0.010*\"mode\" + 0.010*\"produc\" + 0.009*\"veget\" + 0.009*\"candid\" + 0.008*\"offset\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 
00:22:36,470 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"western\" + 0.016*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.008*\"illicit\" + 0.007*\"green\" + 0.007*\"hand\" + 0.006*\"depress\"\n", + "2019-01-31 00:22:36,471 : INFO : topic #40 (0.020): 0.097*\"unit\" + 0.027*\"collector\" + 0.020*\"institut\" + 0.020*\"schuster\" + 0.016*\"student\" + 0.016*\"professor\" + 0.015*\"requir\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:22:36,472 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.057*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.018*\"polici\" + 0.015*\"bypass\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"liber\"\n", + "2019-01-31 00:22:36,478 : INFO : topic diff=0.015791, rho=0.069338\n", + "2019-01-31 00:22:36,635 : INFO : PROGRESS: pass 0, at document #418000/4922894\n", + "2019-01-31 00:22:38,107 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:38,373 : INFO : topic #15 (0.020): 0.013*\"develop\" + 0.013*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"requir\" + 0.009*\"cultur\" + 0.008*\"student\" + 0.008*\"human\" + 0.007*\"group\"\n", + "2019-01-31 00:22:38,374 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.025*\"act\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.010*\"legal\" + 0.007*\"rudolf\" + 0.007*\"unionist\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:22:38,375 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.014*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.009*\"veget\" + 0.009*\"candid\" + 0.008*\"encyclopedia\" + 0.007*\"offset\"\n", + "2019-01-31 00:22:38,376 : INFO : topic #0 (0.020): 0.071*\"statewid\" + 0.044*\"arsen\" + 0.039*\"line\" + 0.033*\"raid\" + 0.028*\"museo\" + 0.018*\"traceabl\" + 0.018*\"pain\" + 
0.017*\"serv\" + 0.015*\"exhaust\" + 0.014*\"word\"\n", + "2019-01-31 00:22:38,378 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.029*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.013*\"player\"\n", + "2019-01-31 00:22:38,383 : INFO : topic diff=0.014223, rho=0.069171\n", + "2019-01-31 00:22:41,174 : INFO : -11.780 per-word bound, 3516.9 perplexity estimate based on a held-out corpus of 2000 documents with 580823 words\n", + "2019-01-31 00:22:41,175 : INFO : PROGRESS: pass 0, at document #420000/4922894\n", + "2019-01-31 00:22:42,637 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:42,902 : INFO : topic #16 (0.020): 0.030*\"priest\" + 0.023*\"king\" + 0.020*\"quarterli\" + 0.019*\"duke\" + 0.017*\"portugues\" + 0.016*\"maria\" + 0.016*\"idiosyncrat\" + 0.016*\"grammat\" + 0.015*\"brazil\" + 0.013*\"rotterdam\"\n", + "2019-01-31 00:22:42,903 : INFO : topic #1 (0.020): 0.049*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.011*\"summer\"\n", + "2019-01-31 00:22:42,904 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.014*\"elabor\" + 0.010*\"mode\" + 0.010*\"produc\" + 0.009*\"veget\" + 0.009*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"offset\"\n", + "2019-01-31 00:22:42,906 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.029*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"player\"\n", + "2019-01-31 00:22:42,907 : INFO : topic #46 (0.020): 0.028*\"damag\" + 0.019*\"stop\" + 0.016*\"wind\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 0.015*\"treeless\" + 0.014*\"norwai\" + 0.013*\"ton\" + 0.013*\"replac\" + 0.013*\"norwegian\"\n", + "2019-01-31 00:22:42,913 : INFO : 
topic diff=0.014296, rho=0.069007\n", + "2019-01-31 00:22:43,068 : INFO : PROGRESS: pass 0, at document #422000/4922894\n", + "2019-01-31 00:22:44,534 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:44,804 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"hormon\" + 0.006*\"acid\" + 0.006*\"effect\"\n", + "2019-01-31 00:22:44,806 : INFO : topic #40 (0.020): 0.096*\"unit\" + 0.026*\"collector\" + 0.021*\"schuster\" + 0.021*\"institut\" + 0.016*\"student\" + 0.016*\"requir\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:22:44,807 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.053*\"franc\" + 0.030*\"pari\" + 0.026*\"sail\" + 0.023*\"jean\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.011*\"loui\" + 0.010*\"piec\" + 0.009*\"focal\"\n", + "2019-01-31 00:22:44,809 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.009*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.004*\"night\" + 0.004*\"bewild\" + 0.004*\"ladi\" + 0.003*\"healthcar\" + 0.003*\"york\"\n", + "2019-01-31 00:22:44,810 : INFO : topic #20 (0.020): 0.132*\"scholar\" + 0.037*\"struggl\" + 0.031*\"high\" + 0.028*\"educ\" + 0.020*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"gothic\" + 0.009*\"class\"\n", + "2019-01-31 00:22:44,816 : INFO : topic diff=0.015195, rho=0.068843\n", + "2019-01-31 00:22:44,969 : INFO : PROGRESS: pass 0, at document #424000/4922894\n", + "2019-01-31 00:22:46,406 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:46,672 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.012*\"bone\" + 0.012*\"john\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:22:46,673 : INFO : topic #25 (0.020): 
0.029*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"area\" + 0.014*\"mount\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 00:22:46,675 : INFO : topic #48 (0.020): 0.078*\"march\" + 0.078*\"sens\" + 0.078*\"octob\" + 0.075*\"april\" + 0.074*\"notion\" + 0.073*\"august\" + 0.072*\"januari\" + 0.072*\"juli\" + 0.069*\"judici\" + 0.068*\"decatur\"\n", + "2019-01-31 00:22:46,676 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.033*\"unionist\" + 0.031*\"cotton\" + 0.023*\"american\" + 0.022*\"new\" + 0.014*\"terri\" + 0.013*\"california\" + 0.013*\"warrior\" + 0.013*\"north\" + 0.012*\"violent\"\n", + "2019-01-31 00:22:46,677 : INFO : topic #31 (0.020): 0.059*\"fusiform\" + 0.023*\"player\" + 0.021*\"scientist\" + 0.020*\"place\" + 0.019*\"taxpay\" + 0.013*\"folei\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.009*\"yard\" + 0.008*\"clot\"\n", + "2019-01-31 00:22:46,683 : INFO : topic diff=0.014879, rho=0.068680\n", + "2019-01-31 00:22:46,842 : INFO : PROGRESS: pass 0, at document #426000/4922894\n", + "2019-01-31 00:22:48,315 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:48,581 : INFO : topic #35 (0.020): 0.049*\"russia\" + 0.031*\"rural\" + 0.031*\"sovereignti\" + 0.026*\"shirin\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.022*\"reprint\" + 0.019*\"turin\" + 0.018*\"moscow\" + 0.016*\"poland\"\n", + "2019-01-31 00:22:48,583 : INFO : topic #17 (0.020): 0.066*\"church\" + 0.019*\"cathol\" + 0.018*\"bishop\" + 0.018*\"christian\" + 0.015*\"sail\" + 0.014*\"jpg\" + 0.014*\"centuri\" + 0.013*\"retroflex\" + 0.012*\"fifteenth\" + 0.010*\"italian\"\n", + "2019-01-31 00:22:48,584 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.021*\"word\" + 0.018*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"author\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:22:48,585 : INFO : topic #45 (0.020): 
0.019*\"black\" + 0.017*\"western\" + 0.016*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"illicit\" + 0.009*\"light\" + 0.008*\"hand\" + 0.008*\"green\" + 0.006*\"depress\"\n", + "2019-01-31 00:22:48,586 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.016*\"martin\" + 0.016*\"champion\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"winner\" + 0.013*\"chamber\"\n", + "2019-01-31 00:22:48,592 : INFO : topic diff=0.014034, rho=0.068519\n", + "2019-01-31 00:22:48,747 : INFO : PROGRESS: pass 0, at document #428000/4922894\n", + "2019-01-31 00:22:50,204 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:50,469 : INFO : topic #19 (0.020): 0.011*\"languag\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"dynam\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.007*\"mean\" + 0.007*\"like\" + 0.006*\"god\"\n", + "2019-01-31 00:22:50,471 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.022*\"player\" + 0.021*\"scientist\" + 0.020*\"place\" + 0.020*\"taxpay\" + 0.013*\"folei\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.009*\"yard\" + 0.009*\"clot\"\n", + "2019-01-31 00:22:50,472 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.071*\"best\" + 0.036*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.018*\"festiv\" + 0.017*\"women\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 00:22:50,473 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.044*\"arsen\" + 0.039*\"line\" + 0.033*\"raid\" + 0.028*\"museo\" + 0.019*\"traceabl\" + 0.018*\"pain\" + 0.017*\"serv\" + 0.015*\"exhaust\" + 0.014*\"word\"\n", + "2019-01-31 00:22:50,474 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.014*\"king\" + 0.012*\"aza\" + 0.011*\"teufel\" + 0.009*\"battalion\" + 0.009*\"empath\" + 0.009*\"till\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.008*\"armi\"\n", + "2019-01-31 00:22:50,480 : INFO : topic diff=0.013507, rho=0.068359\n", + 
"2019-01-31 00:22:50,637 : INFO : PROGRESS: pass 0, at document #430000/4922894\n", + "2019-01-31 00:22:52,093 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:52,363 : INFO : topic #18 (0.020): 0.008*\"théori\" + 0.007*\"kill\" + 0.007*\"later\" + 0.006*\"sack\" + 0.005*\"dai\" + 0.005*\"man\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:22:52,365 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"televis\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.010*\"tajikistan\" + 0.010*\"sri\" + 0.010*\"start\" + 0.009*\"pradesh\" + 0.009*\"khalsa\"\n", + "2019-01-31 00:22:52,366 : INFO : topic #35 (0.020): 0.048*\"russia\" + 0.031*\"rural\" + 0.031*\"sovereignti\" + 0.028*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.023*\"shirin\" + 0.018*\"poland\" + 0.017*\"turin\" + 0.017*\"moscow\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:22:52,368 : INFO : topic #8 (0.020): 0.030*\"law\" + 0.024*\"cortic\" + 0.023*\"act\" + 0.017*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.010*\"legal\" + 0.008*\"justic\" + 0.007*\"judaism\"\n", + "2019-01-31 00:22:52,369 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.071*\"best\" + 0.036*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.018*\"festiv\" + 0.017*\"women\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 00:22:52,375 : INFO : topic diff=0.015549, rho=0.068199\n", + "2019-01-31 00:22:52,540 : INFO : PROGRESS: pass 0, at document #432000/4922894\n", + "2019-01-31 00:22:54,045 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:54,311 : INFO : topic #29 (0.020): 0.011*\"govern\" + 0.011*\"start\" + 0.008*\"countri\" + 0.008*\"yawn\" + 0.008*\"million\" + 0.007*\"replac\" + 0.006*\"nation\" + 0.006*\"théori\" + 0.006*\"function\" + 0.006*\"new\"\n", 
+ "2019-01-31 00:22:54,312 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.049*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.012*\"piec\" + 0.012*\"loui\" + 0.009*\"focal\"\n", + "2019-01-31 00:22:54,313 : INFO : topic #46 (0.020): 0.024*\"damag\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.012*\"replac\" + 0.012*\"turkish\" + 0.011*\"treeless\"\n", + "2019-01-31 00:22:54,315 : INFO : topic #8 (0.020): 0.030*\"law\" + 0.024*\"cortic\" + 0.022*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"justic\" + 0.007*\"judaism\"\n", + "2019-01-31 00:22:54,316 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.013*\"juan\" + 0.012*\"francisco\" + 0.011*\"carlo\" + 0.011*\"josé\" + 0.010*\"santa\"\n", + "2019-01-31 00:22:54,322 : INFO : topic diff=0.017257, rho=0.068041\n", + "2019-01-31 00:22:54,477 : INFO : PROGRESS: pass 0, at document #434000/4922894\n", + "2019-01-31 00:22:55,889 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:56,155 : INFO : topic #35 (0.020): 0.047*\"russia\" + 0.031*\"sovereignti\" + 0.030*\"rural\" + 0.027*\"poison\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.022*\"shirin\" + 0.018*\"poland\" + 0.017*\"turin\" + 0.016*\"moscow\"\n", + "2019-01-31 00:22:56,157 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.023*\"player\" + 0.021*\"scientist\" + 0.020*\"place\" + 0.020*\"taxpay\" + 0.013*\"folei\" + 0.011*\"leagu\" + 0.010*\"ruler\" + 0.009*\"clot\" + 0.008*\"yard\"\n", + "2019-01-31 00:22:56,158 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"john\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:22:56,159 : INFO : 
topic #47 (0.020): 0.068*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.012*\"word\" + 0.012*\"olympo\"\n", + "2019-01-31 00:22:56,161 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.009*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.004*\"night\" + 0.004*\"litig\" + 0.004*\"bewild\" + 0.004*\"ladi\" + 0.003*\"amphora\" + 0.003*\"introductori\"\n", + "2019-01-31 00:22:56,166 : INFO : topic diff=0.013546, rho=0.067884\n", + "2019-01-31 00:22:56,319 : INFO : PROGRESS: pass 0, at document #436000/4922894\n", + "2019-01-31 00:22:57,734 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:58,000 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 00:22:58,001 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.023*\"player\" + 0.022*\"scientist\" + 0.020*\"taxpay\" + 0.020*\"place\" + 0.013*\"folei\" + 0.011*\"leagu\" + 0.010*\"ruler\" + 0.009*\"clot\" + 0.008*\"yard\"\n", + "2019-01-31 00:22:58,003 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.057*\"parti\" + 0.024*\"democrat\" + 0.024*\"voluntari\" + 0.022*\"member\" + 0.019*\"polici\" + 0.015*\"liber\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.014*\"report\"\n", + "2019-01-31 00:22:58,004 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.024*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.012*\"francisco\" + 0.011*\"josé\" + 0.010*\"carlo\" + 0.010*\"santa\"\n", + "2019-01-31 00:22:58,005 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"bone\" + 0.012*\"john\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:22:58,011 : INFO : topic diff=0.013789, 
rho=0.067729\n", + "2019-01-31 00:22:58,165 : INFO : PROGRESS: pass 0, at document #438000/4922894\n", + "2019-01-31 00:22:59,604 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:22:59,870 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.014*\"vol\" + 0.013*\"jewish\" + 0.012*\"israel\" + 0.011*\"berlin\" + 0.011*\"der\" + 0.009*\"itali\" + 0.008*\"european\" + 0.008*\"europ\"\n", + "2019-01-31 00:22:59,872 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"western\" + 0.015*\"colder\" + 0.012*\"record\" + 0.009*\"blind\" + 0.009*\"illicit\" + 0.008*\"hand\" + 0.008*\"light\" + 0.007*\"green\" + 0.006*\"depress\"\n", + "2019-01-31 00:22:59,873 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.040*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.011*\"pope\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:22:59,874 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"taxpay\" + 0.016*\"candid\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"théori\" + 0.010*\"fool\" + 0.009*\"ret\"\n", + "2019-01-31 00:22:59,875 : INFO : topic #13 (0.020): 0.029*\"new\" + 0.028*\"australia\" + 0.026*\"sourc\" + 0.024*\"london\" + 0.024*\"australian\" + 0.023*\"england\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.017*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:22:59,881 : INFO : topic diff=0.013922, rho=0.067574\n", + "2019-01-31 00:23:02,599 : INFO : -11.704 per-word bound, 3336.5 perplexity estimate based on a held-out corpus of 2000 documents with 559222 words\n", + "2019-01-31 00:23:02,600 : INFO : PROGRESS: pass 0, at document #440000/4922894\n", + "2019-01-31 00:23:04,487 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:04,753 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.033*\"publicis\" + 0.021*\"word\" + 0.017*\"new\" + 0.014*\"edit\" 
+ 0.014*\"presid\" + 0.013*\"storag\" + 0.012*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 00:23:04,755 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.033*\"unionist\" + 0.030*\"cotton\" + 0.023*\"american\" + 0.022*\"new\" + 0.014*\"terri\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"violent\"\n", + "2019-01-31 00:23:04,756 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.013*\"francisco\" + 0.012*\"juan\" + 0.010*\"josé\" + 0.010*\"carlo\" + 0.010*\"santa\"\n", + "2019-01-31 00:23:04,757 : INFO : topic #2 (0.020): 0.045*\"isl\" + 0.040*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.011*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:23:04,758 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.017*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"winner\"\n", + "2019-01-31 00:23:04,764 : INFO : topic diff=0.013040, rho=0.067420\n", + "2019-01-31 00:23:04,921 : INFO : PROGRESS: pass 0, at document #442000/4922894\n", + "2019-01-31 00:23:06,870 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:07,136 : INFO : topic #17 (0.020): 0.064*\"church\" + 0.020*\"christian\" + 0.019*\"cathol\" + 0.018*\"bishop\" + 0.015*\"sail\" + 0.013*\"centuri\" + 0.013*\"retroflex\" + 0.012*\"jpg\" + 0.011*\"fifteenth\" + 0.010*\"relationship\"\n", + "2019-01-31 00:23:07,137 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"bone\" + 0.012*\"john\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"deal\"\n", + "2019-01-31 00:23:07,139 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.017*\"champion\" + 
0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"winner\"\n", + "2019-01-31 00:23:07,140 : INFO : topic #40 (0.020): 0.095*\"unit\" + 0.028*\"collector\" + 0.021*\"schuster\" + 0.019*\"institut\" + 0.016*\"student\" + 0.016*\"requir\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:23:07,141 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:23:07,147 : INFO : topic diff=0.014265, rho=0.067267\n", + "2019-01-31 00:23:07,306 : INFO : PROGRESS: pass 0, at document #444000/4922894\n", + "2019-01-31 00:23:08,738 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:09,004 : INFO : topic #39 (0.020): 0.034*\"canada\" + 0.031*\"canadian\" + 0.025*\"taxpay\" + 0.019*\"scientist\" + 0.016*\"basketbal\" + 0.015*\"toronto\" + 0.015*\"clot\" + 0.014*\"hoar\" + 0.013*\"ontario\" + 0.011*\"confer\"\n", + "2019-01-31 00:23:09,005 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"arsen\" + 0.036*\"line\" + 0.033*\"raid\" + 0.031*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.017*\"pain\" + 0.014*\"word\" + 0.014*\"exhaust\"\n", + "2019-01-31 00:23:09,006 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"deal\" + 0.004*\"end\" + 0.004*\"help\"\n", + "2019-01-31 00:23:09,008 : INFO : topic #15 (0.020): 0.013*\"develop\" + 0.013*\"small\" + 0.010*\"commun\" + 0.010*\"organ\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.009*\"requir\" + 0.008*\"student\" + 0.008*\"group\" + 0.008*\"human\"\n", + "2019-01-31 00:23:09,009 : INFO : topic #20 (0.020): 0.133*\"scholar\" + 
0.037*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.017*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.008*\"gothic\"\n", + "2019-01-31 00:23:09,015 : INFO : topic diff=0.014884, rho=0.067116\n", + "2019-01-31 00:23:09,228 : INFO : PROGRESS: pass 0, at document #446000/4922894\n", + "2019-01-31 00:23:10,670 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:10,936 : INFO : topic #41 (0.020): 0.048*\"citi\" + 0.039*\"new\" + 0.022*\"palmer\" + 0.021*\"year\" + 0.015*\"strategist\" + 0.015*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:23:10,937 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"vol\" + 0.011*\"berlin\" + 0.011*\"der\" + 0.009*\"itali\" + 0.008*\"jeremiah\" + 0.008*\"european\"\n", + "2019-01-31 00:23:10,938 : INFO : topic #15 (0.020): 0.013*\"develop\" + 0.013*\"small\" + 0.010*\"commun\" + 0.010*\"organ\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.009*\"requir\" + 0.008*\"student\" + 0.008*\"group\" + 0.008*\"human\"\n", + "2019-01-31 00:23:10,939 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.016*\"buford\" + 0.012*\"rosenwald\" + 0.011*\"histor\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"briarwood\" + 0.010*\"linear\"\n", + "2019-01-31 00:23:10,941 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.022*\"adulthood\" + 0.016*\"hostil\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.012*\"live\" + 0.011*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:23:10,947 : INFO : topic diff=0.013917, rho=0.066965\n", + "2019-01-31 00:23:11,105 : INFO : PROGRESS: pass 0, at document #448000/4922894\n", + "2019-01-31 00:23:12,570 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:12,836 : INFO : topic #12 (0.020): 
0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"servitud\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"utopian\" + 0.005*\"differ\"\n", + "2019-01-31 00:23:12,837 : INFO : topic #47 (0.020): 0.068*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:23:12,838 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"mexican–american\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:23:12,839 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.039*\"new\" + 0.023*\"palmer\" + 0.021*\"year\" + 0.015*\"strategist\" + 0.015*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:23:12,840 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.080*\"octob\" + 0.078*\"march\" + 0.077*\"august\" + 0.072*\"notion\" + 0.072*\"april\" + 0.071*\"juli\" + 0.070*\"januari\" + 0.066*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 00:23:12,847 : INFO : topic diff=0.014961, rho=0.066815\n", + "2019-01-31 00:23:13,000 : INFO : PROGRESS: pass 0, at document #450000/4922894\n", + "2019-01-31 00:23:14,414 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:14,680 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"taxpay\" + 0.016*\"candid\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.010*\"fool\" + 0.010*\"landslid\" + 0.010*\"théori\"\n", + "2019-01-31 00:23:14,681 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.033*\"publicis\" + 0.021*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.014*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:23:14,682 : INFO : topic #0 (0.020): 
0.065*\"statewid\" + 0.043*\"arsen\" + 0.037*\"line\" + 0.036*\"raid\" + 0.031*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.017*\"pain\" + 0.015*\"word\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:23:14,683 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.005*\"utopian\" + 0.005*\"order\"\n", + "2019-01-31 00:23:14,684 : INFO : topic #8 (0.020): 0.031*\"law\" + 0.024*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"rudolf\" + 0.007*\"justic\"\n", + "2019-01-31 00:23:14,690 : INFO : topic diff=0.013215, rho=0.066667\n", + "2019-01-31 00:23:14,845 : INFO : PROGRESS: pass 0, at document #452000/4922894\n", + "2019-01-31 00:23:16,283 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:16,549 : INFO : topic #47 (0.020): 0.068*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:23:16,551 : INFO : topic #36 (0.020): 0.026*\"companhia\" + 0.010*\"network\" + 0.009*\"prognosi\" + 0.009*\"serv\" + 0.008*\"develop\" + 0.008*\"oper\" + 0.008*\"manag\" + 0.008*\"includ\" + 0.007*\"base\" + 0.007*\"busi\"\n", + "2019-01-31 00:23:16,552 : INFO : topic #7 (0.020): 0.019*\"di\" + 0.019*\"snatch\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"john\" + 0.012*\"faster\" + 0.012*\"deal\"\n", + "2019-01-31 00:23:16,553 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.013*\"vol\" + 0.012*\"berlin\" + 0.011*\"der\" + 0.008*\"itali\" + 0.008*\"european\" + 0.008*\"europ\"\n", + "2019-01-31 00:23:16,554 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 
0.042*\"arsen\" + 0.036*\"line\" + 0.036*\"raid\" + 0.031*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.017*\"pain\" + 0.015*\"word\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:23:16,560 : INFO : topic diff=0.014925, rho=0.066519\n", + "2019-01-31 00:23:16,712 : INFO : PROGRESS: pass 0, at document #454000/4922894\n", + "2019-01-31 00:23:18,114 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:18,380 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.033*\"publicis\" + 0.021*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.014*\"presid\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.012*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 00:23:18,381 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.011*\"elabor\" + 0.010*\"produc\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"candid\" + 0.008*\"encyclopedia\" + 0.007*\"offset\"\n", + "2019-01-31 00:23:18,383 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.021*\"adulthood\" + 0.015*\"feel\" + 0.015*\"hostil\" + 0.013*\"male\" + 0.012*\"plaisir\" + 0.012*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:23:18,384 : INFO : topic #40 (0.020): 0.097*\"unit\" + 0.028*\"collector\" + 0.020*\"institut\" + 0.020*\"schuster\" + 0.015*\"student\" + 0.015*\"requir\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.012*\"degre\"\n", + "2019-01-31 00:23:18,385 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.009*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.004*\"bewild\" + 0.004*\"night\" + 0.004*\"ladi\" + 0.004*\"amphora\" + 0.003*\"introductori\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:23:18,391 : INFO : topic diff=0.011715, rho=0.066372\n", + "2019-01-31 00:23:18,544 : INFO : PROGRESS: pass 0, at document #456000/4922894\n", + "2019-01-31 00:23:19,949 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:23:20,216 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.025*\"player\" + 0.022*\"scientist\" + 0.021*\"taxpay\" + 0.021*\"place\" + 0.013*\"folei\" + 0.012*\"leagu\" + 0.009*\"ruler\" + 0.009*\"clot\" + 0.008*\"reconstruct\"\n", + "2019-01-31 00:23:20,217 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"western\" + 0.014*\"colder\" + 0.012*\"record\" + 0.009*\"blind\" + 0.009*\"illicit\" + 0.008*\"hand\" + 0.008*\"green\" + 0.007*\"light\" + 0.006*\"arm\"\n", + "2019-01-31 00:23:20,218 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.067*\"best\" + 0.037*\"yawn\" + 0.034*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.014*\"tokyo\"\n", + "2019-01-31 00:23:20,219 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.017*\"depress\" + 0.015*\"pour\" + 0.011*\"elabor\" + 0.010*\"produc\" + 0.009*\"mode\" + 0.009*\"veget\" + 0.008*\"candid\" + 0.008*\"encyclopedia\" + 0.007*\"offset\"\n", + "2019-01-31 00:23:20,220 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.059*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.022*\"member\" + 0.020*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.014*\"liber\"\n", + "2019-01-31 00:23:20,226 : INFO : topic diff=0.013479, rho=0.066227\n", + "2019-01-31 00:23:20,382 : INFO : PROGRESS: pass 0, at document #458000/4922894\n", + "2019-01-31 00:23:21,829 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:22,095 : INFO : topic #15 (0.020): 0.013*\"small\" + 0.013*\"develop\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.009*\"requir\" + 0.008*\"student\" + 0.008*\"human\" + 0.008*\"group\"\n", + "2019-01-31 00:23:22,096 : INFO : topic #46 (0.020): 0.021*\"damag\" + 0.017*\"norwai\" + 0.016*\"stop\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.014*\"replac\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.012*\"earthquak\" + 
0.011*\"treeless\"\n", + "2019-01-31 00:23:22,097 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.009*\"frontal\" + 0.007*\"exampl\" + 0.006*\"servitud\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 00:23:22,099 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.009*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.004*\"bewild\" + 0.004*\"night\" + 0.004*\"ladi\" + 0.004*\"amphora\" + 0.003*\"dai\"\n", + "2019-01-31 00:23:22,100 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"have\" + 0.006*\"proper\" + 0.006*\"activ\" + 0.006*\"effect\"\n", + "2019-01-31 00:23:22,106 : INFO : topic diff=0.016294, rho=0.066082\n", + "2019-01-31 00:23:24,843 : INFO : -11.496 per-word bound, 2887.3 perplexity estimate based on a held-out corpus of 2000 documents with 545887 words\n", + "2019-01-31 00:23:24,843 : INFO : PROGRESS: pass 0, at document #460000/4922894\n", + "2019-01-31 00:23:26,273 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:26,539 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:23:26,540 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.043*\"arsen\" + 0.038*\"line\" + 0.035*\"raid\" + 0.031*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.016*\"pain\" + 0.016*\"word\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:23:26,542 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.020*\"dutch\" + 0.018*\"player\" + 0.015*\"folei\" + 0.015*\"polit\" + 0.014*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:23:26,543 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"septemb\" + 
0.023*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"movi\" + 0.011*\"acrimoni\" + 0.011*\"direct\"\n", + "2019-01-31 00:23:26,544 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.009*\"candid\" + 0.009*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:23:26,550 : INFO : topic diff=0.012832, rho=0.065938\n", + "2019-01-31 00:23:26,705 : INFO : PROGRESS: pass 0, at document #462000/4922894\n", + "2019-01-31 00:23:28,111 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:28,378 : INFO : topic #31 (0.020): 0.063*\"fusiform\" + 0.024*\"player\" + 0.022*\"scientist\" + 0.021*\"place\" + 0.020*\"taxpay\" + 0.013*\"folei\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.009*\"reconstruct\" + 0.009*\"clot\"\n", + "2019-01-31 00:23:28,378 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.020*\"rivièr\" + 0.016*\"buford\" + 0.012*\"rosenwald\" + 0.011*\"histor\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:23:28,380 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"hormon\" + 0.007*\"media\" + 0.007*\"disco\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"activ\"\n", + "2019-01-31 00:23:28,381 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"toyota\" + 0.014*\"charcoal\" + 0.011*\"vocabulari\"\n", + "2019-01-31 00:23:28,382 : INFO : topic #16 (0.020): 0.028*\"king\" + 0.028*\"priest\" + 0.021*\"quarterli\" + 0.019*\"grammat\" + 0.018*\"duke\" + 0.017*\"maria\" + 0.016*\"idiosyncrat\" + 0.016*\"order\" + 0.015*\"rotterdam\" + 0.014*\"portugues\"\n", + "2019-01-31 00:23:28,388 : INFO : topic diff=0.013818, 
rho=0.065795\n", + "2019-01-31 00:23:28,542 : INFO : PROGRESS: pass 0, at document #464000/4922894\n", + "2019-01-31 00:23:30,019 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:30,285 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"activ\"\n", + "2019-01-31 00:23:30,286 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.009*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"night\" + 0.004*\"amphora\" + 0.004*\"ladi\" + 0.004*\"healthcar\"\n", + "2019-01-31 00:23:30,288 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.033*\"publicis\" + 0.021*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.013*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:23:30,289 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.034*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.022*\"reprint\" + 0.021*\"personifi\" + 0.019*\"moscow\" + 0.016*\"poland\" + 0.016*\"shirin\" + 0.015*\"tyrant\"\n", + "2019-01-31 00:23:30,290 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"help\" + 0.004*\"deal\" + 0.004*\"end\"\n", + "2019-01-31 00:23:30,296 : INFO : topic diff=0.012890, rho=0.065653\n", + "2019-01-31 00:23:30,454 : INFO : PROGRESS: pass 0, at document #466000/4922894\n", + "2019-01-31 00:23:31,876 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:32,142 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.032*\"unionist\" + 0.030*\"cotton\" + 0.024*\"american\" + 0.023*\"new\" + 0.014*\"terri\" + 0.013*\"california\" + 0.013*\"north\" + 0.012*\"warrior\" + 0.012*\"violent\"\n", + "2019-01-31 00:23:32,143 : INFO : topic #11 (0.020): 
0.028*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:23:32,145 : INFO : topic #12 (0.020): 0.011*\"number\" + 0.008*\"frontal\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 00:23:32,146 : INFO : topic #16 (0.020): 0.030*\"king\" + 0.028*\"priest\" + 0.021*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"duke\" + 0.017*\"idiosyncrat\" + 0.017*\"rotterdam\" + 0.016*\"maria\" + 0.015*\"order\" + 0.014*\"portugues\"\n", + "2019-01-31 00:23:32,146 : INFO : topic #13 (0.020): 0.028*\"new\" + 0.027*\"australia\" + 0.026*\"sourc\" + 0.024*\"england\" + 0.024*\"london\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:23:32,152 : INFO : topic diff=0.013784, rho=0.065512\n", + "2019-01-31 00:23:32,310 : INFO : PROGRESS: pass 0, at document #468000/4922894\n", + "2019-01-31 00:23:33,768 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:34,033 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.013*\"israel\" + 0.012*\"jewish\" + 0.012*\"berlin\" + 0.011*\"der\" + 0.009*\"itali\" + 0.008*\"europ\" + 0.008*\"european\"\n", + "2019-01-31 00:23:34,035 : INFO : topic #32 (0.020): 0.060*\"district\" + 0.049*\"vigour\" + 0.043*\"tortur\" + 0.041*\"popolo\" + 0.032*\"cotton\" + 0.026*\"area\" + 0.025*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"earthworm\"\n", + "2019-01-31 00:23:34,036 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.013*\"king\" + 0.013*\"battalion\" + 0.012*\"aza\" + 0.010*\"teufel\" + 0.009*\"empath\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.008*\"armi\" + 
0.008*\"till\"\n", + "2019-01-31 00:23:34,037 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.024*\"aggress\" + 0.023*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"airmen\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.012*\"airbu\"\n", + "2019-01-31 00:23:34,038 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.023*\"player\" + 0.022*\"scientist\" + 0.020*\"place\" + 0.020*\"taxpay\" + 0.013*\"folei\" + 0.012*\"leagu\" + 0.009*\"ruler\" + 0.009*\"barber\" + 0.009*\"clot\"\n", + "2019-01-31 00:23:34,044 : INFO : topic diff=0.014505, rho=0.065372\n", + "2019-01-31 00:23:34,198 : INFO : PROGRESS: pass 0, at document #470000/4922894\n", + "2019-01-31 00:23:35,644 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:35,910 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"john\" + 0.011*\"deal\"\n", + "2019-01-31 00:23:35,911 : INFO : topic #23 (0.020): 0.140*\"audit\" + 0.066*\"best\" + 0.038*\"yawn\" + 0.033*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:23:35,912 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:23:35,913 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"man\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:23:35,915 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.009*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"ladi\" + 0.004*\"amphora\" + 0.004*\"babi\"\n", + "2019-01-31 00:23:35,920 : 
INFO : topic diff=0.014500, rho=0.065233\n", + "2019-01-31 00:23:36,073 : INFO : PROGRESS: pass 0, at document #472000/4922894\n", + "2019-01-31 00:23:37,505 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:37,771 : INFO : topic #1 (0.020): 0.052*\"chilton\" + 0.051*\"china\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.016*\"leah\" + 0.015*\"korean\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.010*\"taiwan\"\n", + "2019-01-31 00:23:37,773 : INFO : topic #19 (0.020): 0.012*\"languag\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"woodcut\" + 0.008*\"mean\" + 0.008*\"charact\" + 0.008*\"uruguayan\" + 0.007*\"like\" + 0.007*\"god\" + 0.006*\"dynam\"\n", + "2019-01-31 00:23:37,774 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.032*\"unionist\" + 0.030*\"cotton\" + 0.024*\"american\" + 0.023*\"new\" + 0.014*\"terri\" + 0.013*\"california\" + 0.013*\"north\" + 0.012*\"warrior\" + 0.012*\"violent\"\n", + "2019-01-31 00:23:37,775 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"taxpay\" + 0.015*\"candid\" + 0.014*\"tornado\" + 0.012*\"find\" + 0.012*\"driver\" + 0.011*\"landslid\" + 0.010*\"horac\" + 0.010*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:23:37,776 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.016*\"place\" + 0.016*\"damn\" + 0.015*\"physician\" + 0.015*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:23:37,782 : INFO : topic diff=0.013358, rho=0.065094\n", + "2019-01-31 00:23:37,939 : INFO : PROGRESS: pass 0, at document #474000/4922894\n", + "2019-01-31 00:23:39,390 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:39,656 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.028*\"germani\" + 0.014*\"israel\" + 0.014*\"vol\" + 0.013*\"jewish\" + 0.013*\"berlin\" + 0.011*\"der\" + 0.008*\"itali\" + 0.008*\"europ\" + 0.008*\"european\"\n", + "2019-01-31 
00:23:39,658 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"man\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.005*\"retrospect\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:23:39,659 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.017*\"depress\" + 0.016*\"pour\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.009*\"produc\" + 0.009*\"candid\" + 0.009*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:23:39,660 : INFO : topic #39 (0.020): 0.034*\"canada\" + 0.028*\"canadian\" + 0.024*\"taxpay\" + 0.020*\"scientist\" + 0.016*\"toronto\" + 0.015*\"basketbal\" + 0.014*\"hoar\" + 0.014*\"clot\" + 0.012*\"ontario\" + 0.011*\"confer\"\n", + "2019-01-31 00:23:39,661 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.010*\"georg\" + 0.008*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:23:39,667 : INFO : topic diff=0.012886, rho=0.064957\n", + "2019-01-31 00:23:39,824 : INFO : PROGRESS: pass 0, at document #476000/4922894\n", + "2019-01-31 00:23:41,262 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:41,528 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.011*\"francisco\" + 0.011*\"josé\" + 0.010*\"carlo\" + 0.010*\"antiqu\"\n", + "2019-01-31 00:23:41,529 : INFO : topic #1 (0.020): 0.051*\"chilton\" + 0.049*\"china\" + 0.026*\"hong\" + 0.026*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"kim\" + 0.015*\"sourc\" + 0.010*\"taiwan\"\n", + "2019-01-31 00:23:41,530 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.029*\"workplac\" + 0.029*\"olymp\" + 0.027*\"champion\" + 0.024*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.019*\"alic\" + 0.018*\"théori\" + 0.018*\"atheist\"\n", + "2019-01-31 00:23:41,532 : INFO : 
topic #45 (0.020): 0.018*\"black\" + 0.016*\"western\" + 0.013*\"colder\" + 0.012*\"record\" + 0.009*\"illicit\" + 0.009*\"blind\" + 0.008*\"green\" + 0.007*\"light\" + 0.007*\"hand\" + 0.006*\"arm\"\n", + "2019-01-31 00:23:41,533 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.016*\"physician\" + 0.016*\"place\" + 0.016*\"orchestr\" + 0.015*\"damn\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:23:41,539 : INFO : topic diff=0.012847, rho=0.064820\n", + "2019-01-31 00:23:41,750 : INFO : PROGRESS: pass 0, at document #478000/4922894\n", + "2019-01-31 00:23:43,193 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:43,458 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.025*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.015*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"legal\" + 0.007*\"consolid\" + 0.007*\"judaism\"\n", + "2019-01-31 00:23:43,459 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.044*\"arsen\" + 0.038*\"line\" + 0.035*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.018*\"word\" + 0.017*\"pain\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:23:43,461 : INFO : topic #17 (0.020): 0.064*\"church\" + 0.021*\"cathol\" + 0.019*\"christian\" + 0.017*\"bishop\" + 0.014*\"retroflex\" + 0.014*\"sail\" + 0.012*\"centuri\" + 0.010*\"jpg\" + 0.009*\"fifteenth\" + 0.009*\"italian\"\n", + "2019-01-31 00:23:43,462 : INFO : topic #19 (0.020): 0.012*\"languag\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"woodcut\" + 0.008*\"mean\" + 0.008*\"charact\" + 0.008*\"uruguayan\" + 0.007*\"like\" + 0.007*\"god\" + 0.007*\"dynam\"\n", + "2019-01-31 00:23:43,463 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.022*\"poison\" + 0.022*\"personifi\" + 0.022*\"reprint\" + 0.019*\"moscow\" + 0.015*\"shirin\" + 0.015*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:23:43,469 : INFO : topic 
diff=0.012082, rho=0.064685\n", + "2019-01-31 00:23:46,297 : INFO : -11.721 per-word bound, 3376.6 perplexity estimate based on a held-out corpus of 2000 documents with 580708 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:23:46,298 : INFO : PROGRESS: pass 0, at document #480000/4922894\n", + "2019-01-31 00:23:47,758 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:48,024 : INFO : topic #17 (0.020): 0.065*\"church\" + 0.021*\"cathol\" + 0.019*\"christian\" + 0.017*\"bishop\" + 0.014*\"retroflex\" + 0.014*\"sail\" + 0.012*\"centuri\" + 0.010*\"jpg\" + 0.009*\"fifteenth\" + 0.009*\"italian\"\n", + "2019-01-31 00:23:48,025 : INFO : topic #12 (0.020): 0.011*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.005*\"differ\" + 0.005*\"utopian\"\n", + "2019-01-31 00:23:48,027 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"man\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.005*\"retrospect\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:23:48,028 : INFO : topic #3 (0.020): 0.041*\"present\" + 0.028*\"offic\" + 0.028*\"minist\" + 0.021*\"member\" + 0.020*\"seri\" + 0.020*\"gener\" + 0.016*\"govern\" + 0.016*\"appeas\" + 0.016*\"serv\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:23:48,029 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"john\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:23:48,035 : INFO : topic diff=0.012352, rho=0.064550\n", + "2019-01-31 00:23:48,194 : INFO : PROGRESS: pass 0, at document #482000/4922894\n", + "2019-01-31 00:23:49,626 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:49,891 : INFO : topic #3 (0.020): 
0.041*\"present\" + 0.028*\"offic\" + 0.028*\"minist\" + 0.021*\"member\" + 0.020*\"seri\" + 0.019*\"gener\" + 0.016*\"govern\" + 0.016*\"appeas\" + 0.016*\"serv\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:23:49,893 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.028*\"workplac\" + 0.027*\"olymp\" + 0.027*\"champion\" + 0.025*\"alic\" + 0.023*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.018*\"atheist\" + 0.018*\"théori\"\n", + "2019-01-31 00:23:49,894 : INFO : topic #41 (0.020): 0.048*\"citi\" + 0.038*\"new\" + 0.023*\"palmer\" + 0.020*\"year\" + 0.014*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:23:49,895 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"martin\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.016*\"chamber\" + 0.015*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:23:49,896 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"arsen\" + 0.039*\"line\" + 0.035*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.017*\"word\" + 0.016*\"pain\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:23:49,902 : INFO : topic diff=0.012371, rho=0.064416\n", + "2019-01-31 00:23:50,059 : INFO : PROGRESS: pass 0, at document #484000/4922894\n", + "2019-01-31 00:23:51,502 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:51,768 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.016*\"buford\" + 0.012*\"constitut\" + 0.011*\"histor\" + 0.011*\"rosenwald\" + 0.010*\"strategist\" + 0.010*\"briarwood\" + 0.010*\"linear\"\n", + "2019-01-31 00:23:51,770 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"man\" + 0.005*\"deal\" + 0.005*\"retrospect\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:23:51,771 : INFO : topic #41 (0.020): 0.048*\"citi\" + 
0.037*\"new\" + 0.023*\"palmer\" + 0.019*\"year\" + 0.014*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:23:51,772 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:23:51,774 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.030*\"incumb\" + 0.015*\"islam\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.009*\"khalsa\" + 0.009*\"tajikistan\" + 0.009*\"start\"\n", + "2019-01-31 00:23:51,779 : INFO : topic diff=0.011678, rho=0.064282\n", + "2019-01-31 00:23:51,937 : INFO : PROGRESS: pass 0, at document #486000/4922894\n", + "2019-01-31 00:23:53,371 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:53,636 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"taxpay\" + 0.015*\"tornado\" + 0.015*\"candid\" + 0.013*\"find\" + 0.012*\"driver\" + 0.012*\"landslid\" + 0.012*\"squatter\" + 0.010*\"théori\" + 0.010*\"fool\"\n", + "2019-01-31 00:23:53,637 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.022*\"moscow\" + 0.021*\"reprint\" + 0.021*\"poison\" + 0.021*\"personifi\" + 0.016*\"unfortun\" + 0.014*\"shirin\" + 0.014*\"poland\"\n", + "2019-01-31 00:23:53,639 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.030*\"incumb\" + 0.015*\"islam\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.009*\"khalsa\" + 0.009*\"tajikistan\" + 0.009*\"start\"\n", + "2019-01-31 00:23:53,640 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"acid\"\n", + "2019-01-31 00:23:53,642 : INFO : topic #30 (0.020): 
0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:23:53,648 : INFO : topic diff=0.014063, rho=0.064150\n", + "2019-01-31 00:23:53,806 : INFO : PROGRESS: pass 0, at document #488000/4922894\n", + "2019-01-31 00:23:55,250 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:55,516 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.039*\"yawn\" + 0.036*\"jacksonvil\" + 0.027*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.018*\"prison\" + 0.017*\"intern\"\n", + "2019-01-31 00:23:55,517 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.023*\"england\" + 0.023*\"london\" + 0.023*\"australian\" + 0.021*\"british\" + 0.021*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:23:55,518 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"arsen\" + 0.038*\"line\" + 0.035*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.017*\"word\" + 0.017*\"serv\" + 0.016*\"pain\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:23:55,519 : INFO : topic #45 (0.020): 0.018*\"black\" + 0.016*\"western\" + 0.013*\"colder\" + 0.013*\"record\" + 0.009*\"illicit\" + 0.009*\"blind\" + 0.009*\"green\" + 0.007*\"light\" + 0.007*\"hand\" + 0.006*\"arm\"\n", + "2019-01-31 00:23:55,521 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.033*\"publicis\" + 0.022*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:23:55,527 : INFO : topic diff=0.013476, rho=0.064018\n", + "2019-01-31 00:23:55,683 : INFO : PROGRESS: pass 0, at document #490000/4922894\n", + "2019-01-31 00:23:57,113 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:57,379 : INFO : topic #18 
(0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"man\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:23:57,381 : INFO : topic #31 (0.020): 0.068*\"fusiform\" + 0.024*\"player\" + 0.021*\"scientist\" + 0.020*\"place\" + 0.019*\"taxpay\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.009*\"barber\" + 0.009*\"ruler\" + 0.009*\"yard\"\n", + "2019-01-31 00:23:57,382 : INFO : topic #15 (0.020): 0.012*\"develop\" + 0.012*\"small\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"cultur\" + 0.009*\"requir\" + 0.008*\"human\" + 0.008*\"student\" + 0.008*\"group\"\n", + "2019-01-31 00:23:57,383 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.026*\"germani\" + 0.013*\"vol\" + 0.013*\"der\" + 0.012*\"israel\" + 0.012*\"jewish\" + 0.012*\"berlin\" + 0.008*\"thong\" + 0.008*\"europ\" + 0.008*\"european\"\n", + "2019-01-31 00:23:57,384 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\" + 0.008*\"north\" + 0.007*\"vacant\"\n", + "2019-01-31 00:23:57,390 : INFO : topic diff=0.011865, rho=0.063888\n", + "2019-01-31 00:23:57,552 : INFO : PROGRESS: pass 0, at document #492000/4922894\n", + "2019-01-31 00:23:59,048 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:23:59,314 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"john\" + 0.012*\"faster\" + 0.011*\"deal\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:23:59,316 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\" + 0.008*\"north\" + 0.007*\"vacant\"\n", + "2019-01-31 00:23:59,317 : INFO : 
topic #38 (0.020): 0.021*\"walter\" + 0.012*\"king\" + 0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"centuri\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.008*\"armi\" + 0.007*\"till\"\n", + "2019-01-31 00:23:59,318 : INFO : topic #3 (0.020): 0.040*\"present\" + 0.029*\"offic\" + 0.027*\"minist\" + 0.021*\"member\" + 0.020*\"seri\" + 0.019*\"gener\" + 0.017*\"chickasaw\" + 0.017*\"govern\" + 0.016*\"appeas\" + 0.015*\"serv\"\n", + "2019-01-31 00:23:59,319 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:23:59,325 : INFO : topic diff=0.012339, rho=0.063758\n", + "2019-01-31 00:23:59,480 : INFO : PROGRESS: pass 0, at document #494000/4922894\n", + "2019-01-31 00:24:00,898 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:01,163 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"john\" + 0.012*\"faster\" + 0.011*\"deal\"\n", + "2019-01-31 00:24:01,165 : INFO : topic #33 (0.020): 0.054*\"french\" + 0.041*\"franc\" + 0.029*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"focal\"\n", + "2019-01-31 00:24:01,166 : INFO : topic #16 (0.020): 0.028*\"priest\" + 0.026*\"king\" + 0.023*\"quarterli\" + 0.021*\"duke\" + 0.018*\"grammat\" + 0.016*\"maria\" + 0.016*\"portugues\" + 0.015*\"count\" + 0.015*\"idiosyncrat\" + 0.014*\"rotterdam\"\n", + "2019-01-31 00:24:01,167 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.016*\"place\" + 0.015*\"physician\" + 0.015*\"olympo\" + 0.015*\"orchestr\" + 0.014*\"damn\" + 0.012*\"word\"\n", + "2019-01-31 00:24:01,168 : INFO : topic #42 (0.020): 0.043*\"german\" + 
0.026*\"germani\" + 0.013*\"vol\" + 0.012*\"der\" + 0.012*\"berlin\" + 0.012*\"israel\" + 0.012*\"jewish\" + 0.008*\"europ\" + 0.008*\"itali\" + 0.008*\"european\"\n", + "2019-01-31 00:24:01,174 : INFO : topic diff=0.012981, rho=0.063628\n", + "2019-01-31 00:24:01,324 : INFO : PROGRESS: pass 0, at document #496000/4922894\n", + "2019-01-31 00:24:02,730 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:02,996 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.031*\"unionist\" + 0.030*\"cotton\" + 0.025*\"american\" + 0.023*\"new\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"north\" + 0.012*\"warrior\" + 0.011*\"year\"\n", + "2019-01-31 00:24:02,997 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.016*\"mount\" + 0.010*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\" + 0.008*\"north\" + 0.008*\"palmer\"\n", + "2019-01-31 00:24:02,999 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.015*\"soviet\" + 0.014*\"francisco\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"mexican\"\n", + "2019-01-31 00:24:03,000 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.029*\"cotton\" + 0.027*\"area\" + 0.026*\"regim\" + 0.025*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:24:03,001 : INFO : topic #14 (0.020): 0.026*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.018*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"airmen\"\n", + "2019-01-31 00:24:03,007 : INFO : topic diff=0.013785, rho=0.063500\n", + "2019-01-31 00:24:03,167 : INFO : PROGRESS: pass 0, at document #498000/4922894\n", + "2019-01-31 00:24:04,725 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:04,991 : INFO : topic #28 (0.020): 0.031*\"build\" + 
0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"briarwood\" + 0.010*\"linear\"\n", + "2019-01-31 00:24:04,992 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"night\" + 0.004*\"litig\" + 0.004*\"bewild\" + 0.003*\"healthcar\" + 0.003*\"ladi\" + 0.003*\"york\"\n", + "2019-01-31 00:24:04,994 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.017*\"martin\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.013*\"withhold\"\n", + "2019-01-31 00:24:04,995 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.016*\"depress\" + 0.016*\"pour\" + 0.011*\"elabor\" + 0.009*\"mode\" + 0.009*\"produc\" + 0.009*\"encyclopedia\" + 0.009*\"candid\" + 0.008*\"veget\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:24:04,996 : INFO : topic #19 (0.020): 0.012*\"languag\" + 0.009*\"origin\" + 0.009*\"form\" + 0.009*\"woodcut\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"uruguayan\" + 0.007*\"god\" + 0.007*\"like\" + 0.006*\"dynam\"\n", + "2019-01-31 00:24:05,003 : INFO : topic diff=0.013094, rho=0.063372\n", + "2019-01-31 00:24:07,722 : INFO : -11.598 per-word bound, 3100.7 perplexity estimate based on a held-out corpus of 2000 documents with 553729 words\n", + "2019-01-31 00:24:07,722 : INFO : PROGRESS: pass 0, at document #500000/4922894\n", + "2019-01-31 00:24:09,152 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:09,418 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:24:09,419 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 
0.006*\"have\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"acid\"\n", + "2019-01-31 00:24:09,420 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.006*\"man\" + 0.006*\"blue\" + 0.005*\"night\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.004*\"dramatist\" + 0.003*\"ladi\" + 0.003*\"healthcar\"\n", + "2019-01-31 00:24:09,422 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"legal\" + 0.008*\"judaism\" + 0.007*\"rudolf\"\n", + "2019-01-31 00:24:09,423 : INFO : topic #3 (0.020): 0.039*\"present\" + 0.029*\"offic\" + 0.026*\"minist\" + 0.021*\"member\" + 0.021*\"seri\" + 0.019*\"gener\" + 0.017*\"chickasaw\" + 0.016*\"govern\" + 0.016*\"appeas\" + 0.015*\"serv\"\n", + "2019-01-31 00:24:09,428 : INFO : topic diff=0.012178, rho=0.063246\n", + "2019-01-31 00:24:09,586 : INFO : PROGRESS: pass 0, at document #502000/4922894\n", + "2019-01-31 00:24:11,044 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:11,310 : INFO : topic #29 (0.020): 0.011*\"govern\" + 0.010*\"start\" + 0.008*\"million\" + 0.008*\"yawn\" + 0.008*\"countri\" + 0.006*\"bank\" + 0.006*\"replac\" + 0.006*\"function\" + 0.006*\"nation\" + 0.006*\"théori\"\n", + "2019-01-31 00:24:11,312 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.006*\"kill\" + 0.006*\"sack\" + 0.005*\"dai\" + 0.005*\"man\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"end\"\n", + "2019-01-31 00:24:11,313 : INFO : topic #25 (0.020): 0.027*\"ring\" + 0.019*\"warmth\" + 0.016*\"area\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\" + 0.008*\"north\" + 0.008*\"palmer\"\n", + "2019-01-31 00:24:11,314 : INFO : topic #8 (0.020): 0.032*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"legal\" + 0.008*\"judaism\" 
+ 0.007*\"rudolf\"\n", + "2019-01-31 00:24:11,315 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:24:11,321 : INFO : topic diff=0.011153, rho=0.063119\n", + "2019-01-31 00:24:11,482 : INFO : PROGRESS: pass 0, at document #504000/4922894\n", + "2019-01-31 00:24:12,961 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:13,228 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.014*\"jame\" + 0.013*\"david\" + 0.012*\"rival\" + 0.010*\"georg\" + 0.008*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:24:13,229 : INFO : topic #20 (0.020): 0.130*\"scholar\" + 0.036*\"struggl\" + 0.029*\"high\" + 0.029*\"educ\" + 0.020*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"pseudo\" + 0.009*\"task\" + 0.008*\"gothic\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:24:13,230 : INFO : topic #14 (0.020): 0.026*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"airmen\"\n", + "2019-01-31 00:24:13,231 : INFO : topic #31 (0.020): 0.067*\"fusiform\" + 0.024*\"player\" + 0.021*\"scientist\" + 0.021*\"place\" + 0.019*\"taxpay\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"ruler\" + 0.009*\"barber\" + 0.009*\"yard\"\n", + "2019-01-31 00:24:13,232 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.019*\"tourist\" + 0.018*\"martin\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.013*\"withhold\"\n", + "2019-01-31 00:24:13,238 : INFO : topic diff=0.013192, rho=0.062994\n", + "2019-01-31 00:24:13,394 : INFO : PROGRESS: pass 0, at document #506000/4922894\n", + 
"2019-01-31 00:24:14,842 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:15,108 : INFO : topic #20 (0.020): 0.131*\"scholar\" + 0.036*\"struggl\" + 0.029*\"high\" + 0.028*\"educ\" + 0.019*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"pseudo\" + 0.010*\"task\" + 0.008*\"gothic\"\n", + "2019-01-31 00:24:15,109 : INFO : topic #16 (0.020): 0.031*\"priest\" + 0.026*\"king\" + 0.022*\"quarterli\" + 0.020*\"duke\" + 0.018*\"grammat\" + 0.017*\"maria\" + 0.015*\"portugues\" + 0.015*\"rotterdam\" + 0.014*\"count\" + 0.014*\"idiosyncrat\"\n", + "2019-01-31 00:24:15,111 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.041*\"american\" + 0.026*\"valour\" + 0.019*\"dutch\" + 0.016*\"player\" + 0.016*\"polit\" + 0.015*\"folei\" + 0.013*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:24:15,112 : INFO : topic #36 (0.020): 0.023*\"companhia\" + 0.010*\"network\" + 0.009*\"prognosi\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"manag\" + 0.008*\"oper\" + 0.008*\"busi\" + 0.007*\"produc\" + 0.007*\"includ\"\n", + "2019-01-31 00:24:15,113 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"soviet\" + 0.014*\"francisco\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.010*\"lizard\" + 0.010*\"mexican\"\n", + "2019-01-31 00:24:15,119 : INFO : topic diff=0.011201, rho=0.062869\n", + "2019-01-31 00:24:15,272 : INFO : PROGRESS: pass 0, at document #508000/4922894\n", + "2019-01-31 00:24:16,686 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:16,952 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.057*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"bypass\" + 0.014*\"republ\" + 0.014*\"selma\" + 0.014*\"hous\"\n", + "2019-01-31 00:24:16,953 : INFO : topic #29 (0.020): 0.011*\"govern\" + 0.010*\"start\" + 0.008*\"million\" + 0.008*\"yawn\" + 
0.007*\"countri\" + 0.006*\"bank\" + 0.006*\"replac\" + 0.006*\"function\" + 0.006*\"nation\" + 0.006*\"théori\"\n", + "2019-01-31 00:24:16,954 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.030*\"son\" + 0.028*\"rel\" + 0.027*\"reconstruct\" + 0.021*\"band\" + 0.017*\"simultan\" + 0.016*\"muscl\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:24:16,956 : INFO : topic #45 (0.020): 0.019*\"black\" + 0.016*\"western\" + 0.013*\"colder\" + 0.012*\"record\" + 0.010*\"illicit\" + 0.009*\"blind\" + 0.008*\"green\" + 0.008*\"light\" + 0.006*\"hand\" + 0.006*\"arm\"\n", + "2019-01-31 00:24:16,957 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:24:16,963 : INFO : topic diff=0.011546, rho=0.062746\n", + "2019-01-31 00:24:17,172 : INFO : PROGRESS: pass 0, at document #510000/4922894\n", + "2019-01-31 00:24:18,618 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:18,884 : INFO : topic #14 (0.020): 0.026*\"forc\" + 0.022*\"walter\" + 0.021*\"aggress\" + 0.018*\"com\" + 0.018*\"armi\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.010*\"airmen\"\n", + "2019-01-31 00:24:18,886 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"soviet\" + 0.013*\"francisco\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.010*\"plung\"\n", + "2019-01-31 00:24:18,887 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.028*\"canadian\" + 0.022*\"taxpay\" + 0.019*\"scientist\" + 0.016*\"basketbal\" + 0.016*\"toronto\" + 0.014*\"hoar\" + 0.013*\"clot\" + 0.012*\"ontario\" + 0.011*\"confer\"\n", + "2019-01-31 00:24:18,888 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"warmth\" + 0.016*\"area\" + 0.015*\"lagrang\" + 0.015*\"mount\" + 
0.009*\"foam\" + 0.008*\"land\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.008*\"palmer\"\n", + "2019-01-31 00:24:18,889 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.026*\"democrat\" + 0.025*\"voluntari\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.015*\"liber\" + 0.014*\"bypass\" + 0.014*\"selma\"\n", + "2019-01-31 00:24:18,895 : INFO : topic diff=0.011627, rho=0.062622\n", + "2019-01-31 00:24:19,056 : INFO : PROGRESS: pass 0, at document #512000/4922894\n", + "2019-01-31 00:24:20,526 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:20,792 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.026*\"democrat\" + 0.025*\"voluntari\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.014*\"seaport\"\n", + "2019-01-31 00:24:20,794 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.026*\"septemb\" + 0.024*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:24:20,795 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.022*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:24:20,796 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.024*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.016*\"soviet\" + 0.013*\"francisco\" + 0.012*\"mexican\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\"\n", + "2019-01-31 00:24:20,797 : INFO : topic #45 (0.020): 0.018*\"black\" + 0.016*\"western\" + 0.013*\"colder\" + 0.012*\"record\" + 0.010*\"illicit\" + 0.009*\"blind\" + 0.008*\"green\" + 0.007*\"light\" + 0.006*\"hand\" + 0.006*\"depress\"\n", + "2019-01-31 00:24:20,803 : INFO : topic diff=0.013517, rho=0.062500\n", + "2019-01-31 00:24:20,958 : INFO : PROGRESS: pass 0, at document #514000/4922894\n", 
+ "2019-01-31 00:24:22,385 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:22,651 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.029*\"collector\" + 0.021*\"institut\" + 0.020*\"schuster\" + 0.018*\"professor\" + 0.017*\"student\" + 0.016*\"requir\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:24:22,653 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.029*\"canadian\" + 0.022*\"taxpay\" + 0.019*\"scientist\" + 0.016*\"basketbal\" + 0.015*\"toronto\" + 0.015*\"hoar\" + 0.013*\"ontario\" + 0.012*\"clot\" + 0.010*\"confer\"\n", + "2019-01-31 00:24:22,654 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.012*\"televis\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"start\" + 0.009*\"singh\" + 0.009*\"sri\"\n", + "2019-01-31 00:24:22,655 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.007*\"man\" + 0.006*\"blue\" + 0.005*\"belinda\" + 0.005*\"night\" + 0.005*\"litig\" + 0.004*\"bewild\" + 0.003*\"dramatist\" + 0.003*\"ladi\"\n", + "2019-01-31 00:24:22,656 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.023*\"london\" + 0.022*\"british\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.013*\"north\"\n", + "2019-01-31 00:24:22,662 : INFO : topic diff=0.011288, rho=0.062378\n", + "2019-01-31 00:24:22,817 : INFO : PROGRESS: pass 0, at document #516000/4922894\n", + "2019-01-31 00:24:24,251 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:24,517 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"olymp\" + 0.026*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.021*\"rainfal\" + 0.020*\"alic\" + 0.020*\"atheist\"\n", + "2019-01-31 00:24:24,518 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"warmth\" + 0.016*\"area\" + 0.016*\"lagrang\" + 
0.015*\"mount\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"sourc\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:24:24,519 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.024*\"spain\" + 0.020*\"mexico\" + 0.017*\"del\" + 0.015*\"soviet\" + 0.013*\"francisco\" + 0.012*\"mexican\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.010*\"lizard\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:24:24,521 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.014*\"sourc\" + 0.013*\"kim\" + 0.010*\"taiwan\"\n", + "2019-01-31 00:24:24,522 : INFO : topic #16 (0.020): 0.032*\"priest\" + 0.027*\"king\" + 0.021*\"quarterli\" + 0.020*\"duke\" + 0.018*\"grammat\" + 0.016*\"rotterdam\" + 0.016*\"maria\" + 0.015*\"idiosyncrat\" + 0.015*\"portugues\" + 0.014*\"count\"\n", + "2019-01-31 00:24:24,527 : INFO : topic diff=0.012022, rho=0.062257\n", + "2019-01-31 00:24:24,680 : INFO : PROGRESS: pass 0, at document #518000/4922894\n", + "2019-01-31 00:24:26,097 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:26,363 : INFO : topic #36 (0.020): 0.022*\"companhia\" + 0.010*\"network\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.009*\"prognosi\" + 0.008*\"manag\" + 0.008*\"oper\" + 0.008*\"produc\" + 0.008*\"base\" + 0.007*\"includ\"\n", + "2019-01-31 00:24:26,365 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.022*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:24:26,366 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.034*\"perceptu\" + 0.022*\"theater\" + 0.018*\"compos\" + 0.016*\"physician\" + 0.015*\"place\" + 0.015*\"orchestr\" + 0.014*\"damn\" + 0.014*\"olympo\" + 0.013*\"wahl\"\n", + "2019-01-31 00:24:26,367 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 
0.026*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:24:26,368 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"olymp\" + 0.025*\"men\" + 0.025*\"alic\" + 0.022*\"medal\" + 0.021*\"event\" + 0.020*\"rainfal\" + 0.020*\"atheist\"\n", + "2019-01-31 00:24:26,374 : INFO : topic diff=0.012125, rho=0.062137\n", + "2019-01-31 00:24:29,058 : INFO : -11.537 per-word bound, 2972.0 perplexity estimate based on a held-out corpus of 2000 documents with 548527 words\n", + "2019-01-31 00:24:29,058 : INFO : PROGRESS: pass 0, at document #520000/4922894\n", + "2019-01-31 00:24:30,461 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:30,727 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.025*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:24:30,728 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.011*\"organ\" + 0.009*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"requir\" + 0.008*\"human\" + 0.008*\"student\"\n", + "2019-01-31 00:24:30,729 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.020*\"taxpay\" + 0.017*\"candid\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.013*\"ret\" + 0.012*\"find\" + 0.010*\"horac\" + 0.010*\"landslid\" + 0.010*\"théori\"\n", + "2019-01-31 00:24:30,731 : INFO : topic #41 (0.020): 0.048*\"citi\" + 0.037*\"new\" + 0.023*\"palmer\" + 0.019*\"year\" + 0.016*\"strategist\" + 0.015*\"center\" + 0.011*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:24:30,732 : INFO : topic #45 (0.020): 0.018*\"black\" + 0.016*\"western\" + 0.013*\"colder\" + 0.011*\"record\" + 0.011*\"illicit\" + 0.009*\"blind\" + 
0.008*\"green\" + 0.007*\"light\" + 0.006*\"depress\" + 0.006*\"hand\"\n", + "2019-01-31 00:24:30,738 : INFO : topic diff=0.009969, rho=0.062017\n", + "2019-01-31 00:24:30,891 : INFO : PROGRESS: pass 0, at document #522000/4922894\n", + "2019-01-31 00:24:32,308 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:32,574 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.018*\"armi\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"airmen\"\n", + "2019-01-31 00:24:32,575 : INFO : topic #48 (0.020): 0.084*\"octob\" + 0.083*\"march\" + 0.079*\"sens\" + 0.075*\"juli\" + 0.074*\"januari\" + 0.073*\"august\" + 0.073*\"notion\" + 0.071*\"april\" + 0.071*\"decatur\" + 0.070*\"judici\"\n", + "2019-01-31 00:24:32,576 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.016*\"buford\" + 0.012*\"histor\" + 0.011*\"strategist\" + 0.011*\"rosenwald\" + 0.011*\"constitut\" + 0.010*\"briarwood\" + 0.010*\"highland\"\n", + "2019-01-31 00:24:32,577 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:24:32,578 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"poison\" + 0.029*\"rural\" + 0.021*\"poland\" + 0.019*\"reprint\" + 0.019*\"personifi\" + 0.018*\"moscow\" + 0.017*\"unfortun\" + 0.011*\"turin\"\n", + "2019-01-31 00:24:32,584 : INFO : topic diff=0.014437, rho=0.061898\n", + "2019-01-31 00:24:32,738 : INFO : PROGRESS: pass 0, at document #524000/4922894\n", + "2019-01-31 00:24:34,154 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:34,420 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.017*\"depress\" + 0.016*\"pour\" + 0.010*\"elabor\" + 0.009*\"produc\" 
+ 0.009*\"mode\" + 0.008*\"encyclopedia\" + 0.008*\"veget\" + 0.008*\"candid\" + 0.007*\"develop\"\n", + "2019-01-31 00:24:34,421 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"new\" + 0.023*\"london\" + 0.023*\"british\" + 0.022*\"australian\" + 0.022*\"england\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:24:34,422 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.007*\"man\" + 0.006*\"blue\" + 0.005*\"night\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"belinda\" + 0.003*\"wither\" + 0.003*\"healthcar\"\n", + "2019-01-31 00:24:34,423 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.016*\"lagrang\" + 0.014*\"mount\" + 0.008*\"foam\" + 0.008*\"sourc\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:24:34,424 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.028*\"canadian\" + 0.022*\"taxpay\" + 0.019*\"scientist\" + 0.016*\"hoar\" + 0.016*\"toronto\" + 0.016*\"basketbal\" + 0.012*\"ontario\" + 0.012*\"clot\" + 0.010*\"confer\"\n", + "2019-01-31 00:24:34,430 : INFO : topic diff=0.011209, rho=0.061780\n", + "2019-01-31 00:24:34,589 : INFO : PROGRESS: pass 0, at document #526000/4922894\n", + "2019-01-31 00:24:36,044 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:36,310 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.007*\"man\" + 0.006*\"blue\" + 0.005*\"night\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.004*\"belinda\" + 0.003*\"wither\" + 0.003*\"healthcar\"\n", + "2019-01-31 00:24:36,311 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"dynam\" + 0.007*\"charact\" + 0.006*\"god\"\n", + "2019-01-31 00:24:36,312 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.013*\"bone\" + 
0.012*\"faster\" + 0.012*\"life\" + 0.012*\"john\" + 0.011*\"deal\"\n", + "2019-01-31 00:24:36,313 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.025*\"germani\" + 0.015*\"der\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.012*\"berlin\" + 0.011*\"israel\" + 0.010*\"jeremiah\" + 0.009*\"die\" + 0.008*\"und\"\n", + "2019-01-31 00:24:36,315 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.026*\"septemb\" + 0.024*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:24:36,320 : INFO : topic diff=0.012560, rho=0.061663\n", + "2019-01-31 00:24:36,479 : INFO : PROGRESS: pass 0, at document #528000/4922894\n", + "2019-01-31 00:24:37,929 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:38,196 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.021*\"taxpay\" + 0.016*\"candid\" + 0.014*\"tornado\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"ret\" + 0.011*\"horac\" + 0.011*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 00:24:38,197 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.017*\"martin\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"workplac\"\n", + "2019-01-31 00:24:38,198 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.032*\"unionist\" + 0.029*\"cotton\" + 0.027*\"american\" + 0.023*\"new\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"north\" + 0.012*\"warrior\" + 0.012*\"violent\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:24:38,199 : INFO : topic #33 (0.020): 0.055*\"french\" + 0.043*\"franc\" + 0.029*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:24:38,201 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.025*\"germani\" + 0.015*\"der\" + 
0.015*\"vol\" + 0.013*\"jewish\" + 0.012*\"berlin\" + 0.011*\"israel\" + 0.011*\"jeremiah\" + 0.009*\"die\" + 0.009*\"und\"\n", + "2019-01-31 00:24:38,206 : INFO : topic diff=0.010578, rho=0.061546\n", + "2019-01-31 00:24:38,366 : INFO : PROGRESS: pass 0, at document #530000/4922894\n", + "2019-01-31 00:24:39,811 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:40,077 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.027*\"reconstruct\" + 0.021*\"band\" + 0.017*\"simultan\" + 0.017*\"muscl\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:24:40,078 : INFO : topic #47 (0.020): 0.060*\"muscl\" + 0.031*\"perceptu\" + 0.027*\"physician\" + 0.019*\"theater\" + 0.017*\"orchestr\" + 0.017*\"compos\" + 0.015*\"olympo\" + 0.014*\"son\" + 0.013*\"place\" + 0.013*\"damn\"\n", + "2019-01-31 00:24:40,079 : INFO : topic #41 (0.020): 0.049*\"citi\" + 0.038*\"new\" + 0.022*\"palmer\" + 0.019*\"year\" + 0.016*\"center\" + 0.015*\"strategist\" + 0.011*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:24:40,080 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.028*\"collector\" + 0.022*\"institut\" + 0.021*\"schuster\" + 0.017*\"student\" + 0.016*\"requir\" + 0.016*\"professor\" + 0.013*\"word\" + 0.012*\"governor\" + 0.012*\"degre\"\n", + "2019-01-31 00:24:40,081 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.007*\"acid\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"effect\" + 0.006*\"pathwai\"\n", + "2019-01-31 00:24:40,087 : INFO : topic diff=0.013411, rho=0.061430\n", + "2019-01-31 00:24:40,238 : INFO : PROGRESS: pass 0, at document #532000/4922894\n", + "2019-01-31 00:24:41,624 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:41,890 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"disco\" + 
0.008*\"media\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"acid\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"pathwai\"\n", + "2019-01-31 00:24:41,891 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.028*\"champion\" + 0.028*\"workplac\" + 0.026*\"men\" + 0.026*\"olymp\" + 0.024*\"alic\" + 0.021*\"medal\" + 0.021*\"event\" + 0.021*\"rainfal\" + 0.020*\"atheist\"\n", + "2019-01-31 00:24:41,893 : INFO : topic #29 (0.020): 0.011*\"govern\" + 0.010*\"start\" + 0.008*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"bank\" + 0.006*\"replac\" + 0.006*\"function\" + 0.006*\"placement\" + 0.006*\"nation\"\n", + "2019-01-31 00:24:41,894 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.029*\"incumb\" + 0.013*\"televis\" + 0.013*\"islam\" + 0.012*\"muskoge\" + 0.011*\"pakistan\" + 0.010*\"start\" + 0.010*\"singh\" + 0.009*\"khalsa\" + 0.009*\"sri\"\n", + "2019-01-31 00:24:41,895 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:24:41,901 : INFO : topic diff=0.012359, rho=0.061314\n", + "2019-01-31 00:24:42,059 : INFO : PROGRESS: pass 0, at document #534000/4922894\n", + "2019-01-31 00:24:43,504 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:43,771 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.018*\"damag\" + 0.017*\"wind\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.015*\"norwegian\" + 0.014*\"sweden\" + 0.011*\"replac\" + 0.011*\"treeless\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:24:43,772 : INFO : topic #15 (0.020): 0.012*\"develop\" + 0.012*\"small\" + 0.011*\"organ\" + 0.009*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"human\" + 0.008*\"requir\" + 0.008*\"group\" + 0.008*\"student\"\n", + "2019-01-31 00:24:43,773 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"arsen\" + 0.039*\"line\" + 
0.033*\"raid\" + 0.031*\"museo\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.015*\"word\" + 0.015*\"pain\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:24:43,774 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.013*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 00:24:43,775 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.027*\"reconstruct\" + 0.021*\"band\" + 0.017*\"simultan\" + 0.017*\"muscl\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:24:43,781 : INFO : topic diff=0.011819, rho=0.061199\n", + "2019-01-31 00:24:43,935 : INFO : PROGRESS: pass 0, at document #536000/4922894\n", + "2019-01-31 00:24:45,356 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:45,623 : INFO : topic #17 (0.020): 0.068*\"church\" + 0.020*\"cathol\" + 0.020*\"christian\" + 0.017*\"bishop\" + 0.014*\"retroflex\" + 0.014*\"sail\" + 0.012*\"centuri\" + 0.010*\"italian\" + 0.009*\"historiographi\" + 0.008*\"relationship\"\n", + "2019-01-31 00:24:45,624 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.018*\"depress\" + 0.016*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.009*\"produc\" + 0.008*\"encyclopedia\" + 0.008*\"veget\" + 0.008*\"candid\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:24:45,625 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.011*\"king\" + 0.010*\"battalion\" + 0.009*\"aza\" + 0.009*\"centuri\" + 0.008*\"empath\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\"\n", + "2019-01-31 00:24:45,627 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.048*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.015*\"sourc\" + 0.014*\"leah\" + 0.013*\"han\" + 0.013*\"kim\"\n", + "2019-01-31 00:24:45,628 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 
0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:24:45,634 : INFO : topic diff=0.010792, rho=0.061085\n", + "2019-01-31 00:24:45,787 : INFO : PROGRESS: pass 0, at document #538000/4922894\n", + "2019-01-31 00:24:47,195 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:47,462 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"man\" + 0.005*\"deal\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:24:47,463 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"mexican\" + 0.011*\"lizard\"\n", + "2019-01-31 00:24:47,464 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.033*\"perceptu\" + 0.025*\"physician\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.017*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"place\" + 0.013*\"son\" + 0.012*\"damn\"\n", + "2019-01-31 00:24:47,465 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.067*\"best\" + 0.038*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.020*\"women\" + 0.018*\"festiv\" + 0.017*\"prison\" + 0.016*\"intern\"\n", + "2019-01-31 00:24:47,467 : INFO : topic #45 (0.020): 0.017*\"black\" + 0.015*\"western\" + 0.013*\"colder\" + 0.011*\"record\" + 0.010*\"illicit\" + 0.009*\"blind\" + 0.008*\"green\" + 0.008*\"light\" + 0.007*\"fifteenth\" + 0.006*\"jpg\"\n", + "2019-01-31 00:24:47,473 : INFO : topic diff=0.010960, rho=0.060971\n", + "2019-01-31 00:24:50,207 : INFO : -11.877 per-word bound, 3761.5 perplexity estimate based on a held-out corpus of 2000 documents with 546535 words\n", + "2019-01-31 00:24:50,207 : INFO : PROGRESS: pass 0, at document #540000/4922894\n", + "2019-01-31 00:24:51,645 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:24:51,911 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.027*\"collector\" + 0.021*\"schuster\" + 0.021*\"institut\" + 0.017*\"requir\" + 0.017*\"student\" + 0.016*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:24:51,913 : INFO : topic #27 (0.020): 0.066*\"questionnair\" + 0.021*\"taxpay\" + 0.018*\"candid\" + 0.014*\"tornado\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.011*\"champion\" + 0.011*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 00:24:51,914 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"televis\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"singh\" + 0.010*\"start\" + 0.009*\"khalsa\" + 0.009*\"sri\"\n", + "2019-01-31 00:24:51,915 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"warmth\" + 0.016*\"mount\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"sourc\" + 0.008*\"palmer\" + 0.008*\"lobe\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:24:51,916 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.024*\"cortic\" + 0.023*\"act\" + 0.019*\"start\" + 0.016*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\" + 0.007*\"rudolf\"\n", + "2019-01-31 00:24:51,922 : INFO : topic diff=0.012260, rho=0.060858\n", + "2019-01-31 00:24:52,078 : INFO : PROGRESS: pass 0, at document #542000/4922894\n", + "2019-01-31 00:24:53,505 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:53,772 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.022*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:24:53,773 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.028*\"factor\" + 0.023*\"adulthood\" + 0.016*\"hostil\" + 0.016*\"feel\" + 0.014*\"male\" + 
0.011*\"live\" + 0.011*\"genu\" + 0.011*\"plaisir\" + 0.010*\"yawn\"\n", + "2019-01-31 00:24:53,774 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:24:53,775 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.027*\"reconstruct\" + 0.021*\"band\" + 0.017*\"simultan\" + 0.017*\"muscl\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:24:53,777 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.018*\"depress\" + 0.017*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.008*\"candid\" + 0.008*\"encyclopedia\" + 0.007*\"develop\"\n", + "2019-01-31 00:24:53,782 : INFO : topic diff=0.011440, rho=0.060746\n", + "2019-01-31 00:24:53,997 : INFO : PROGRESS: pass 0, at document #544000/4922894\n", + "2019-01-31 00:24:55,421 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:55,688 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:24:55,689 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.025*\"final\" + 0.023*\"tourist\" + 0.021*\"wife\" + 0.018*\"champion\" + 0.017*\"martin\" + 0.017*\"taxpay\" + 0.016*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:24:55,690 : INFO : topic #31 (0.020): 0.064*\"fusiform\" + 0.025*\"player\" + 0.021*\"scientist\" + 0.021*\"place\" + 0.020*\"taxpay\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.011*\"yard\" + 0.010*\"barber\" + 0.009*\"ruler\"\n", + "2019-01-31 00:24:55,691 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.048*\"vigour\" + 0.045*\"popolo\" + 0.041*\"tortur\" + 0.028*\"cotton\" + 
0.028*\"regim\" + 0.028*\"area\" + 0.025*\"multitud\" + 0.023*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:24:55,692 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.030*\"poison\" + 0.022*\"personifi\" + 0.020*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.018*\"unfortun\" + 0.012*\"czech\"\n", + "2019-01-31 00:24:55,698 : INFO : topic diff=0.011468, rho=0.060634\n", + "2019-01-31 00:24:55,854 : INFO : PROGRESS: pass 0, at document #546000/4922894\n", + "2019-01-31 00:24:57,299 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:57,565 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.007*\"southern\" + 0.006*\"servitud\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.005*\"utopian\"\n", + "2019-01-31 00:24:57,566 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.049*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.023*\"korea\" + 0.018*\"korean\" + 0.015*\"sourc\" + 0.012*\"leah\" + 0.012*\"han\" + 0.012*\"kim\"\n", + "2019-01-31 00:24:57,568 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.008*\"sourc\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 00:24:57,569 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.017*\"depress\" + 0.017*\"pour\" + 0.009*\"elabor\" + 0.009*\"produc\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"develop\"\n", + "2019-01-31 00:24:57,570 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.031*\"perceptu\" + 0.027*\"physician\" + 0.018*\"theater\" + 0.018*\"wahl\" + 0.018*\"orchestr\" + 0.018*\"compos\" + 0.013*\"place\" + 0.013*\"olympo\" + 0.012*\"son\"\n", + "2019-01-31 00:24:57,576 : INFO : topic diff=0.012075, rho=0.060523\n", + "2019-01-31 00:24:57,738 : INFO : PROGRESS: pass 0, at document #548000/4922894\n", 
+ "2019-01-31 00:24:59,203 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:24:59,469 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.031*\"perceptu\" + 0.026*\"physician\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.018*\"orchestr\" + 0.017*\"wahl\" + 0.013*\"place\" + 0.013*\"olympo\" + 0.012*\"damn\"\n", + "2019-01-31 00:24:59,470 : INFO : topic #45 (0.020): 0.017*\"black\" + 0.016*\"western\" + 0.013*\"colder\" + 0.011*\"record\" + 0.010*\"blind\" + 0.010*\"illicit\" + 0.008*\"light\" + 0.008*\"green\" + 0.007*\"fifteenth\" + 0.006*\"jpg\"\n", + "2019-01-31 00:24:59,471 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.027*\"voluntari\" + 0.026*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.016*\"republ\" + 0.015*\"liber\" + 0.015*\"bypass\" + 0.014*\"selma\"\n", + "2019-01-31 00:24:59,473 : INFO : topic #20 (0.020): 0.131*\"scholar\" + 0.035*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.019*\"yawn\" + 0.018*\"collector\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"pseudo\" + 0.008*\"task\"\n", + "2019-01-31 00:24:59,474 : INFO : topic #31 (0.020): 0.063*\"fusiform\" + 0.025*\"player\" + 0.022*\"scientist\" + 0.021*\"place\" + 0.020*\"taxpay\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.011*\"yard\" + 0.010*\"barber\" + 0.009*\"clot\"\n", + "2019-01-31 00:24:59,480 : INFO : topic diff=0.015389, rho=0.060412\n", + "2019-01-31 00:24:59,637 : INFO : PROGRESS: pass 0, at document #550000/4922894\n", + "2019-01-31 00:25:01,065 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:01,330 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.024*\"adulthood\" + 0.017*\"feel\" + 0.016*\"hostil\" + 0.014*\"male\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:25:01,332 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.048*\"chilton\" + 0.023*\"hong\" + 0.023*\"korea\" + 0.022*\"kong\" + 
0.018*\"korean\" + 0.015*\"sourc\" + 0.015*\"kim\" + 0.014*\"leah\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:25:01,333 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.011*\"king\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.009*\"teufel\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"till\"\n", + "2019-01-31 00:25:01,334 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.025*\"player\" + 0.022*\"scientist\" + 0.021*\"place\" + 0.021*\"taxpay\" + 0.014*\"leagu\" + 0.012*\"folei\" + 0.011*\"yard\" + 0.010*\"barber\" + 0.009*\"clot\"\n", + "2019-01-31 00:25:01,336 : INFO : topic #17 (0.020): 0.068*\"church\" + 0.020*\"christian\" + 0.019*\"cathol\" + 0.017*\"bishop\" + 0.015*\"retroflex\" + 0.014*\"sail\" + 0.012*\"centuri\" + 0.010*\"italian\" + 0.009*\"relationship\" + 0.008*\"historiographi\"\n", + "2019-01-31 00:25:01,341 : INFO : topic diff=0.009282, rho=0.060302\n", + "2019-01-31 00:25:01,501 : INFO : PROGRESS: pass 0, at document #552000/4922894\n", + "2019-01-31 00:25:02,965 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:03,232 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.027*\"collector\" + 0.022*\"schuster\" + 0.021*\"institut\" + 0.018*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:25:03,233 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.080*\"octob\" + 0.077*\"sens\" + 0.075*\"januari\" + 0.072*\"juli\" + 0.072*\"notion\" + 0.070*\"april\" + 0.069*\"august\" + 0.069*\"judici\" + 0.068*\"decatur\"\n", + "2019-01-31 00:25:03,235 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.005*\"differ\"\n", + "2019-01-31 00:25:03,236 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 
0.016*\"hostil\" + 0.014*\"male\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:25:03,237 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.048*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.022*\"korea\" + 0.017*\"korean\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.014*\"leah\" + 0.012*\"ashvil\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:25:03,243 : INFO : topic diff=0.014395, rho=0.060193\n", + "2019-01-31 00:25:03,401 : INFO : PROGRESS: pass 0, at document #554000/4922894\n", + "2019-01-31 00:25:04,845 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:05,111 : INFO : topic #39 (0.020): 0.035*\"canada\" + 0.028*\"canadian\" + 0.021*\"taxpay\" + 0.019*\"scientist\" + 0.017*\"hoar\" + 0.016*\"basketbal\" + 0.016*\"toronto\" + 0.015*\"ontario\" + 0.012*\"confer\" + 0.012*\"clot\"\n", + "2019-01-31 00:25:05,112 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.045*\"franc\" + 0.028*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.011*\"loui\" + 0.011*\"piec\" + 0.010*\"focal\"\n", + "2019-01-31 00:25:05,114 : INFO : topic #29 (0.020): 0.010*\"govern\" + 0.010*\"start\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"function\" + 0.007*\"bank\" + 0.006*\"replac\" + 0.006*\"théori\" + 0.006*\"nation\"\n", + "2019-01-31 00:25:05,115 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.017*\"depress\" + 0.016*\"pour\" + 0.009*\"elabor\" + 0.009*\"produc\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"encyclopedia\" + 0.007*\"candid\" + 0.007*\"develop\"\n", + "2019-01-31 00:25:05,116 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.018*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:25:05,122 : INFO : topic diff=0.011124, rho=0.060084\n", + 
"2019-01-31 00:25:05,278 : INFO : PROGRESS: pass 0, at document #556000/4922894\n", + "2019-01-31 00:25:06,697 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:06,964 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.028*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.018*\"requir\" + 0.016*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:25:06,965 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.028*\"incumb\" + 0.014*\"islam\" + 0.014*\"televis\" + 0.011*\"pakistan\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.010*\"start\" + 0.010*\"anglo\" + 0.010*\"iran\"\n", + "2019-01-31 00:25:06,966 : INFO : topic #41 (0.020): 0.047*\"citi\" + 0.037*\"new\" + 0.025*\"palmer\" + 0.020*\"year\" + 0.015*\"center\" + 0.015*\"strategist\" + 0.011*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:25:06,967 : INFO : topic #23 (0.020): 0.141*\"audit\" + 0.067*\"best\" + 0.037*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.021*\"women\" + 0.020*\"festiv\" + 0.018*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:25:06,968 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.080*\"octob\" + 0.077*\"sens\" + 0.076*\"januari\" + 0.073*\"juli\" + 0.071*\"notion\" + 0.071*\"april\" + 0.069*\"judici\" + 0.069*\"august\" + 0.068*\"decatur\"\n", + "2019-01-31 00:25:06,974 : INFO : topic diff=0.010680, rho=0.059976\n", + "2019-01-31 00:25:07,132 : INFO : PROGRESS: pass 0, at document #558000/4922894\n", + "2019-01-31 00:25:08,569 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:08,835 : INFO : topic #35 (0.020): 0.051*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.022*\"personifi\" + 0.021*\"reprint\" + 0.018*\"moscow\" + 0.017*\"poland\" + 0.017*\"unfortun\" + 0.016*\"tyrant\"\n", + "2019-01-31 00:25:08,836 : INFO : topic #47 
(0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.023*\"physician\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.017*\"orchestr\" + 0.014*\"wahl\" + 0.014*\"olympo\" + 0.014*\"place\" + 0.013*\"damn\"\n", + "2019-01-31 00:25:08,838 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.006*\"dynam\" + 0.006*\"centuri\" + 0.006*\"god\"\n", + "2019-01-31 00:25:08,838 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"new\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.021*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:25:08,839 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.023*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"rosenwald\" + 0.009*\"depress\"\n", + "2019-01-31 00:25:08,845 : INFO : topic diff=0.011311, rho=0.059868\n", + "2019-01-31 00:25:11,662 : INFO : -11.495 per-word bound, 2885.7 perplexity estimate based on a held-out corpus of 2000 documents with 607011 words\n", + "2019-01-31 00:25:11,663 : INFO : PROGRESS: pass 0, at document #560000/4922894\n", + "2019-01-31 00:25:13,122 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:13,388 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.022*\"word\" + 0.016*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"author\" + 0.012*\"worldwid\"\n", + "2019-01-31 00:25:13,389 : INFO : topic #17 (0.020): 0.067*\"church\" + 0.023*\"cathol\" + 0.020*\"dioces\" + 0.019*\"christian\" + 0.016*\"bishop\" + 0.014*\"retroflex\" + 0.014*\"sail\" + 0.012*\"centuri\" + 0.009*\"italian\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:25:13,390 : INFO : topic #35 (0.020): 0.051*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 
0.026*\"poison\" + 0.022*\"personifi\" + 0.021*\"reprint\" + 0.018*\"moscow\" + 0.017*\"unfortun\" + 0.017*\"poland\" + 0.016*\"tyrant\"\n", + "2019-01-31 00:25:13,392 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.005*\"retrospect\" + 0.005*\"dai\" + 0.005*\"deal\" + 0.004*\"man\" + 0.004*\"end\" + 0.004*\"help\"\n", + "2019-01-31 00:25:13,393 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.013*\"faster\" + 0.012*\"life\" + 0.012*\"john\" + 0.011*\"deal\"\n", + "2019-01-31 00:25:13,399 : INFO : topic diff=0.012397, rho=0.059761\n", + "2019-01-31 00:25:13,555 : INFO : PROGRESS: pass 0, at document #562000/4922894\n", + "2019-01-31 00:25:14,985 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:15,250 : INFO : topic #36 (0.020): 0.022*\"companhia\" + 0.010*\"network\" + 0.009*\"develop\" + 0.009*\"prognosi\" + 0.008*\"serv\" + 0.008*\"manag\" + 0.008*\"base\" + 0.008*\"oper\" + 0.008*\"includ\" + 0.007*\"produc\"\n", + "2019-01-31 00:25:15,252 : INFO : topic #40 (0.020): 0.094*\"unit\" + 0.028*\"collector\" + 0.023*\"institut\" + 0.023*\"schuster\" + 0.017*\"requir\" + 0.016*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:25:15,252 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.025*\"final\" + 0.022*\"tourist\" + 0.020*\"wife\" + 0.018*\"taxpay\" + 0.018*\"champion\" + 0.018*\"martin\" + 0.016*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"workplac\"\n", + "2019-01-31 00:25:15,254 : INFO : topic #45 (0.020): 0.016*\"western\" + 0.016*\"black\" + 0.014*\"colder\" + 0.011*\"record\" + 0.010*\"blind\" + 0.010*\"illicit\" + 0.007*\"light\" + 0.007*\"green\" + 0.007*\"fifteenth\" + 0.007*\"jpg\"\n", + "2019-01-31 00:25:15,254 : INFO : topic #41 (0.020): 0.047*\"citi\" + 0.037*\"new\" + 0.024*\"palmer\" + 0.020*\"year\" + 
0.015*\"center\" + 0.015*\"strategist\" + 0.011*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:25:15,260 : INFO : topic diff=0.010572, rho=0.059655\n", + "2019-01-31 00:25:15,416 : INFO : PROGRESS: pass 0, at document #564000/4922894\n", + "2019-01-31 00:25:16,849 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:17,115 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"southern\" + 0.007*\"frontal\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 00:25:17,116 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.079*\"octob\" + 0.077*\"sens\" + 0.077*\"januari\" + 0.071*\"juli\" + 0.070*\"notion\" + 0.070*\"april\" + 0.069*\"judici\" + 0.069*\"august\" + 0.068*\"decatur\"\n", + "2019-01-31 00:25:17,117 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.025*\"final\" + 0.022*\"tourist\" + 0.020*\"wife\" + 0.018*\"taxpay\" + 0.018*\"champion\" + 0.017*\"martin\" + 0.016*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"workplac\"\n", + "2019-01-31 00:25:17,118 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.006*\"dynam\" + 0.006*\"centuri\" + 0.006*\"god\"\n", + "2019-01-31 00:25:17,120 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.026*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.013*\"berlin\" + 0.010*\"jeremiah\" + 0.008*\"greek\" + 0.008*\"und\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:25:17,125 : INFO : topic diff=0.011876, rho=0.059549\n", + "2019-01-31 00:25:17,281 : INFO : PROGRESS: pass 0, at document #566000/4922894\n", + "2019-01-31 00:25:18,697 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:18,963 : INFO : topic #38 
(0.020): 0.021*\"walter\" + 0.011*\"aza\" + 0.010*\"king\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.009*\"teufel\" + 0.009*\"centuri\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"till\"\n", + "2019-01-31 00:25:18,964 : INFO : topic #29 (0.020): 0.011*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"bank\" + 0.007*\"function\" + 0.006*\"replac\" + 0.006*\"théori\" + 0.006*\"new\"\n", + "2019-01-31 00:25:18,965 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.046*\"franc\" + 0.028*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.011*\"loui\" + 0.010*\"piec\" + 0.010*\"focal\"\n", + "2019-01-31 00:25:18,967 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.079*\"octob\" + 0.076*\"sens\" + 0.076*\"januari\" + 0.070*\"notion\" + 0.070*\"juli\" + 0.068*\"april\" + 0.067*\"judici\" + 0.067*\"august\" + 0.067*\"decatur\"\n", + "2019-01-31 00:25:18,968 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.022*\"personifi\" + 0.021*\"reprint\" + 0.018*\"unfortun\" + 0.017*\"poland\" + 0.017*\"moscow\" + 0.015*\"tyrant\"\n", + "2019-01-31 00:25:18,973 : INFO : topic diff=0.011214, rho=0.059444\n", + "2019-01-31 00:25:19,125 : INFO : PROGRESS: pass 0, at document #568000/4922894\n", + "2019-01-31 00:25:20,525 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:20,791 : INFO : topic #23 (0.020): 0.143*\"audit\" + 0.068*\"best\" + 0.037*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.021*\"women\" + 0.019*\"festiv\" + 0.017*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:25:20,792 : INFO : topic #15 (0.020): 0.013*\"small\" + 0.012*\"develop\" + 0.010*\"commun\" + 0.010*\"organ\" + 0.009*\"word\" + 0.009*\"cultur\" + 0.009*\"group\" + 0.008*\"requir\" + 0.008*\"socialist\" + 0.008*\"human\"\n", + "2019-01-31 00:25:20,794 : INFO : topic #36 (0.020): 
0.022*\"companhia\" + 0.010*\"network\" + 0.009*\"prognosi\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"manag\" + 0.008*\"includ\" + 0.008*\"oper\" + 0.008*\"base\" + 0.007*\"user\"\n", + "2019-01-31 00:25:20,795 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"physician\" + 0.019*\"compos\" + 0.019*\"theater\" + 0.016*\"orchestr\" + 0.014*\"olympo\" + 0.014*\"place\" + 0.013*\"damn\" + 0.012*\"wahl\"\n", + "2019-01-31 00:25:20,796 : INFO : topic #39 (0.020): 0.034*\"canada\" + 0.028*\"canadian\" + 0.020*\"taxpay\" + 0.019*\"scientist\" + 0.017*\"hoar\" + 0.016*\"basketbal\" + 0.015*\"toronto\" + 0.015*\"ontario\" + 0.011*\"confer\" + 0.011*\"clot\"\n", + "2019-01-31 00:25:20,802 : INFO : topic diff=0.012117, rho=0.059339\n", + "2019-01-31 00:25:20,957 : INFO : PROGRESS: pass 0, at document #570000/4922894\n", + "2019-01-31 00:25:22,362 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:22,628 : INFO : topic #29 (0.020): 0.011*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"bank\" + 0.007*\"function\" + 0.006*\"replac\" + 0.006*\"théori\" + 0.006*\"placement\"\n", + "2019-01-31 00:25:22,629 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.027*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.016*\"hostil\" + 0.015*\"male\" + 0.011*\"live\" + 0.010*\"plaisir\" + 0.010*\"yawn\" + 0.010*\"genu\"\n", + "2019-01-31 00:25:22,630 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.028*\"area\" + 0.028*\"regim\" + 0.027*\"cotton\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.021*\"prosper\"\n", + "2019-01-31 00:25:22,631 : INFO : topic #39 (0.020): 0.035*\"canada\" + 0.028*\"canadian\" + 0.020*\"taxpay\" + 0.018*\"scientist\" + 0.017*\"hoar\" + 0.016*\"basketbal\" + 0.015*\"toronto\" + 0.014*\"ontario\" + 0.012*\"confer\" + 0.011*\"clot\"\n", + "2019-01-31 00:25:22,632 : INFO : topic #19 
(0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"god\" + 0.006*\"centuri\" + 0.006*\"dynam\"\n", + "2019-01-31 00:25:22,638 : INFO : topic diff=0.011523, rho=0.059235\n", + "2019-01-31 00:25:22,791 : INFO : PROGRESS: pass 0, at document #572000/4922894\n", + "2019-01-31 00:25:24,212 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:24,478 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:25:24,479 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.015*\"western\" + 0.014*\"colder\" + 0.012*\"record\" + 0.010*\"blind\" + 0.010*\"illicit\" + 0.008*\"fifteenth\" + 0.007*\"light\" + 0.007*\"green\" + 0.007*\"jpg\"\n", + "2019-01-31 00:25:24,480 : INFO : topic #8 (0.020): 0.032*\"act\" + 0.028*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.016*\"ricardo\" + 0.012*\"case\" + 0.010*\"allei\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"rudolf\"\n", + "2019-01-31 00:25:24,482 : INFO : topic #39 (0.020): 0.035*\"canada\" + 0.028*\"canadian\" + 0.020*\"taxpay\" + 0.018*\"scientist\" + 0.017*\"hoar\" + 0.016*\"basketbal\" + 0.014*\"toronto\" + 0.014*\"ontario\" + 0.012*\"confer\" + 0.010*\"clot\"\n", + "2019-01-31 00:25:24,483 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"highland\"\n", + "2019-01-31 00:25:24,488 : INFO : topic diff=0.011371, rho=0.059131\n", + "2019-01-31 00:25:24,706 : INFO : PROGRESS: pass 0, at document #574000/4922894\n", + "2019-01-31 00:25:26,191 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:25:26,457 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"night\" + 0.003*\"healthcar\" + 0.003*\"amphora\" + 0.003*\"ladi\"\n", + "2019-01-31 00:25:26,458 : INFO : topic #29 (0.020): 0.011*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"replac\" + 0.006*\"placement\" + 0.006*\"théori\"\n", + "2019-01-31 00:25:26,459 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"depress\"\n", + "2019-01-31 00:25:26,460 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.011*\"aza\" + 0.010*\"king\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.009*\"teufel\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"till\"\n", + "2019-01-31 00:25:26,461 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.008*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:25:26,467 : INFO : topic diff=0.011891, rho=0.059028\n", + "2019-01-31 00:25:26,623 : INFO : PROGRESS: pass 0, at document #576000/4922894\n", + "2019-01-31 00:25:28,045 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:28,312 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n", + "2019-01-31 00:25:28,313 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.015*\"western\" + 0.014*\"colder\" + 0.012*\"record\" + 0.010*\"blind\" + 0.010*\"illicit\" + 0.009*\"fifteenth\" + 0.008*\"light\" + 0.007*\"green\" + 0.007*\"jpg\"\n", + "2019-01-31 00:25:28,314 
: INFO : topic #2 (0.020): 0.046*\"isl\" + 0.039*\"shield\" + 0.020*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.010*\"coalit\" + 0.009*\"class\"\n", + "2019-01-31 00:25:28,315 : INFO : topic #6 (0.020): 0.066*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:25:28,316 : INFO : topic #36 (0.020): 0.022*\"companhia\" + 0.011*\"network\" + 0.009*\"prognosi\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.008*\"manag\" + 0.008*\"oper\" + 0.008*\"includ\" + 0.008*\"base\" + 0.007*\"produc\"\n", + "2019-01-31 00:25:28,322 : INFO : topic diff=0.010918, rho=0.058926\n", + "2019-01-31 00:25:28,478 : INFO : PROGRESS: pass 0, at document #578000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:25:29,906 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:30,172 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.017*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:25:30,173 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"media\" + 0.007*\"hormon\" + 0.006*\"cancer\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:25:30,174 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.033*\"cotton\" + 0.030*\"unionist\" + 0.028*\"american\" + 0.022*\"new\" + 0.013*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.011*\"violent\"\n", + "2019-01-31 00:25:30,175 : INFO : topic #20 (0.020): 0.130*\"scholar\" + 0.037*\"struggl\" + 0.030*\"high\" + 0.029*\"educ\" + 0.019*\"yawn\" + 0.017*\"collector\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 
0.009*\"district\" + 0.009*\"second\"\n", + "2019-01-31 00:25:30,176 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.039*\"shield\" + 0.020*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.010*\"coalit\" + 0.009*\"sai\"\n", + "2019-01-31 00:25:30,182 : INFO : topic diff=0.012336, rho=0.058824\n", + "2019-01-31 00:25:32,955 : INFO : -11.900 per-word bound, 3822.2 perplexity estimate based on a held-out corpus of 2000 documents with 556773 words\n", + "2019-01-31 00:25:32,955 : INFO : PROGRESS: pass 0, at document #580000/4922894\n", + "2019-01-31 00:25:34,414 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:34,680 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.009*\"depress\"\n", + "2019-01-31 00:25:34,681 : INFO : topic #23 (0.020): 0.142*\"audit\" + 0.070*\"best\" + 0.037*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"noll\" + 0.022*\"japanes\" + 0.021*\"women\" + 0.019*\"festiv\" + 0.016*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:25:34,682 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.026*\"canadian\" + 0.020*\"taxpay\" + 0.019*\"scientist\" + 0.016*\"hoar\" + 0.015*\"basketbal\" + 0.015*\"toronto\" + 0.014*\"ontario\" + 0.012*\"confer\" + 0.010*\"new\"\n", + "2019-01-31 00:25:34,683 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.027*\"collector\" + 0.022*\"institut\" + 0.022*\"schuster\" + 0.017*\"requir\" + 0.017*\"student\" + 0.014*\"professor\" + 0.013*\"degre\" + 0.012*\"governor\" + 0.012*\"word\"\n", + "2019-01-31 00:25:34,684 : INFO : topic #9 (0.020): 0.078*\"bone\" + 0.039*\"american\" + 0.026*\"valour\" + 0.019*\"dutch\" + 0.017*\"player\" + 0.016*\"folei\" + 0.016*\"polit\" + 0.015*\"english\" + 0.011*\"simpler\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:25:34,690 : INFO : topic 
diff=0.009998, rho=0.058722\n", + "2019-01-31 00:25:34,843 : INFO : PROGRESS: pass 0, at document #582000/4922894\n", + "2019-01-31 00:25:36,252 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:36,519 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.020*\"aggress\" + 0.017*\"oper\" + 0.016*\"com\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:25:36,520 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.027*\"final\" + 0.022*\"tourist\" + 0.020*\"wife\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.017*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 00:25:36,521 : INFO : topic #6 (0.020): 0.066*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:25:36,522 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.019*\"taxpay\" + 0.016*\"candid\" + 0.016*\"squatter\" + 0.015*\"tornado\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.011*\"théori\" + 0.011*\"find\" + 0.011*\"rick\"\n", + "2019-01-31 00:25:36,523 : INFO : topic #8 (0.020): 0.030*\"act\" + 0.028*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.016*\"ricardo\" + 0.013*\"case\" + 0.009*\"legal\" + 0.009*\"polaris\" + 0.009*\"allei\" + 0.007*\"rudolf\"\n", + "2019-01-31 00:25:36,529 : INFO : topic diff=0.011187, rho=0.058621\n", + "2019-01-31 00:25:36,685 : INFO : PROGRESS: pass 0, at document #584000/4922894\n", + "2019-01-31 00:25:38,121 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:38,387 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.026*\"canadian\" + 0.020*\"taxpay\" + 0.018*\"scientist\" + 0.016*\"hoar\" + 0.016*\"basketbal\" + 0.015*\"toronto\" + 0.014*\"ontario\" + 0.014*\"confer\" + 0.011*\"new\"\n", + "2019-01-31 
00:25:38,388 : INFO : topic #13 (0.020): 0.031*\"australia\" + 0.027*\"sourc\" + 0.027*\"new\" + 0.023*\"australian\" + 0.023*\"london\" + 0.022*\"england\" + 0.021*\"ireland\" + 0.020*\"british\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:25:38,389 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.013*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.009*\"paul\" + 0.008*\"mexican–american\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:25:38,391 : INFO : topic #33 (0.020): 0.056*\"french\" + 0.043*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:25:38,392 : INFO : topic #20 (0.020): 0.130*\"scholar\" + 0.037*\"struggl\" + 0.030*\"high\" + 0.029*\"educ\" + 0.019*\"yawn\" + 0.018*\"collector\" + 0.014*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"district\" + 0.008*\"second\"\n", + "2019-01-31 00:25:38,398 : INFO : topic diff=0.012064, rho=0.058521\n", + "2019-01-31 00:25:38,554 : INFO : PROGRESS: pass 0, at document #586000/4922894\n", + "2019-01-31 00:25:39,991 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:40,261 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:25:40,262 : INFO : topic #40 (0.020): 0.094*\"unit\" + 0.028*\"collector\" + 0.023*\"institut\" + 0.022*\"schuster\" + 0.017*\"requir\" + 0.017*\"student\" + 0.014*\"professor\" + 0.013*\"degre\" + 0.012*\"word\" + 0.012*\"governor\"\n", + "2019-01-31 00:25:40,263 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"produc\" + 0.009*\"elabor\" + 0.008*\"spectacl\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.008*\"candid\" + 0.007*\"develop\"\n", + "2019-01-31 
00:25:40,264 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.080*\"octob\" + 0.075*\"sens\" + 0.073*\"januari\" + 0.071*\"notion\" + 0.068*\"juli\" + 0.067*\"april\" + 0.066*\"august\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 00:25:40,265 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.004*\"man\" + 0.004*\"deal\" + 0.004*\"like\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:25:40,271 : INFO : topic diff=0.010885, rho=0.058421\n", + "2019-01-31 00:25:40,426 : INFO : PROGRESS: pass 0, at document #588000/4922894\n", + "2019-01-31 00:25:41,844 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:42,110 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"bewild\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.005*\"night\" + 0.003*\"ladi\" + 0.003*\"amphora\" + 0.003*\"healthcar\"\n", + "2019-01-31 00:25:42,112 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"deal\" + 0.004*\"like\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:25:42,113 : INFO : topic #40 (0.020): 0.094*\"unit\" + 0.028*\"collector\" + 0.023*\"institut\" + 0.022*\"schuster\" + 0.018*\"requir\" + 0.017*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"governor\" + 0.012*\"word\"\n", + "2019-01-31 00:25:42,114 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.028*\"workplac\" + 0.027*\"men\" + 0.027*\"champion\" + 0.026*\"olymp\" + 0.023*\"medal\" + 0.021*\"event\" + 0.020*\"alic\" + 0.020*\"atheist\" + 0.020*\"rainfal\"\n", + "2019-01-31 00:25:42,115 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.010*\"form\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"centuri\" + 0.007*\"english\" + 0.006*\"god\"\n", + "2019-01-31 00:25:42,121 : INFO : 
topic diff=0.012561, rho=0.058321\n", + "2019-01-31 00:25:42,277 : INFO : PROGRESS: pass 0, at document #590000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:25:43,717 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:43,983 : INFO : topic #17 (0.020): 0.071*\"church\" + 0.021*\"cathol\" + 0.019*\"christian\" + 0.018*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.012*\"centuri\" + 0.012*\"dioces\" + 0.011*\"italian\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:25:43,984 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.006*\"bewild\" + 0.005*\"litig\" + 0.004*\"night\" + 0.003*\"christma\" + 0.003*\"ladi\" + 0.003*\"amphora\"\n", + "2019-01-31 00:25:43,986 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.027*\"men\" + 0.027*\"workplac\" + 0.027*\"champion\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.022*\"alic\" + 0.022*\"event\" + 0.021*\"rainfal\" + 0.021*\"atheist\"\n", + "2019-01-31 00:25:43,987 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:25:43,988 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.020*\"aggress\" + 0.019*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.016*\"oper\" + 0.012*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 00:25:43,994 : INFO : topic diff=0.012532, rho=0.058222\n", + "2019-01-31 00:25:44,150 : INFO : PROGRESS: pass 0, at document #592000/4922894\n", + "2019-01-31 00:25:45,566 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:45,832 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.019*\"daphn\" + 0.014*\"lazi\" + 
0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:25:45,833 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.007*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.005*\"night\" + 0.003*\"christma\" + 0.003*\"ladi\" + 0.003*\"amphora\"\n", + "2019-01-31 00:25:45,835 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.027*\"act\" + 0.024*\"cortic\" + 0.017*\"start\" + 0.016*\"ricardo\" + 0.013*\"case\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.007*\"allei\"\n", + "2019-01-31 00:25:45,836 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.022*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:25:45,837 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.039*\"sovereignti\" + 0.031*\"rural\" + 0.025*\"turin\" + 0.024*\"poison\" + 0.022*\"reprint\" + 0.021*\"personifi\" + 0.018*\"moscow\" + 0.017*\"unfortun\" + 0.016*\"poland\"\n", + "2019-01-31 00:25:45,843 : INFO : topic diff=0.010819, rho=0.058124\n", + "2019-01-31 00:25:45,997 : INFO : PROGRESS: pass 0, at document #594000/4922894\n", + "2019-01-31 00:25:47,416 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:47,682 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.008*\"sourc\"\n", + "2019-01-31 00:25:47,684 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"nativist\" + 0.010*\"class\" + 0.010*\"fleet\" + 0.010*\"ellison\"\n", + "2019-01-31 00:25:47,685 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.023*\"theater\" + 0.019*\"compos\" + 0.017*\"physician\" + 0.015*\"place\" + 0.014*\"orchestr\" + 0.014*\"damn\" + 
0.014*\"olympo\" + 0.012*\"son\"\n", + "2019-01-31 00:25:47,686 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"disco\" + 0.008*\"caus\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"effect\" + 0.006*\"hormon\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:25:47,687 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"tourist\" + 0.020*\"wife\" + 0.018*\"champion\" + 0.018*\"taxpay\" + 0.016*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 00:25:47,693 : INFO : topic diff=0.011287, rho=0.058026\n", + "2019-01-31 00:25:47,853 : INFO : PROGRESS: pass 0, at document #596000/4922894\n", + "2019-01-31 00:25:49,275 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:49,541 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.010*\"class\" + 0.010*\"ellison\"\n", + "2019-01-31 00:25:49,543 : INFO : topic #16 (0.020): 0.032*\"king\" + 0.031*\"priest\" + 0.019*\"quarterli\" + 0.018*\"duke\" + 0.018*\"grammat\" + 0.016*\"idiosyncrat\" + 0.015*\"maria\" + 0.015*\"rotterdam\" + 0.014*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 00:25:49,544 : INFO : topic #36 (0.020): 0.022*\"companhia\" + 0.010*\"network\" + 0.009*\"prognosi\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"base\" + 0.008*\"includ\" + 0.008*\"oper\" + 0.007*\"pop\" + 0.007*\"manag\"\n", + "2019-01-31 00:25:49,545 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.027*\"champion\" + 0.027*\"workplac\" + 0.027*\"men\" + 0.026*\"olymp\" + 0.022*\"medal\" + 0.022*\"alic\" + 0.022*\"event\" + 0.021*\"rainfal\" + 0.020*\"atheist\"\n", + "2019-01-31 00:25:49,546 : INFO : topic #20 (0.020): 0.130*\"scholar\" + 0.038*\"struggl\" + 0.030*\"high\" + 0.029*\"educ\" + 0.019*\"yawn\" + 0.018*\"collector\" + 0.013*\"prognosi\" + 0.010*\"task\" + 
0.009*\"gothic\" + 0.009*\"second\"\n", + "2019-01-31 00:25:49,552 : INFO : topic diff=0.011764, rho=0.057928\n", + "2019-01-31 00:25:49,716 : INFO : PROGRESS: pass 0, at document #598000/4922894\n", + "2019-01-31 00:25:51,175 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:51,441 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"author\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:25:51,442 : INFO : topic #6 (0.020): 0.067*\"fewer\" + 0.025*\"septemb\" + 0.021*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:25:51,443 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.027*\"champion\" + 0.027*\"workplac\" + 0.027*\"olymp\" + 0.027*\"men\" + 0.022*\"medal\" + 0.022*\"alic\" + 0.021*\"event\" + 0.021*\"rainfal\" + 0.020*\"atheist\"\n", + "2019-01-31 00:25:51,444 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"octob\" + 0.075*\"sens\" + 0.072*\"januari\" + 0.070*\"notion\" + 0.066*\"juli\" + 0.065*\"april\" + 0.064*\"august\" + 0.064*\"decatur\" + 0.061*\"judici\"\n", + "2019-01-31 00:25:51,445 : INFO : topic #1 (0.020): 0.050*\"china\" + 0.046*\"chilton\" + 0.030*\"korea\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.020*\"korean\" + 0.019*\"sourc\" + 0.013*\"leah\" + 0.012*\"kim\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:25:51,451 : INFO : topic diff=0.011433, rho=0.057831\n", + "2019-01-31 00:25:54,186 : INFO : -11.643 per-word bound, 3198.9 perplexity estimate based on a held-out corpus of 2000 documents with 567072 words\n", + "2019-01-31 00:25:54,186 : INFO : PROGRESS: pass 0, at document #600000/4922894\n", + "2019-01-31 00:25:55,613 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:55,879 : INFO : topic #29 
(0.020): 0.010*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.008*\"countri\" + 0.007*\"bank\" + 0.007*\"function\" + 0.006*\"placement\" + 0.006*\"replac\" + 0.006*\"new\"\n", + "2019-01-31 00:25:55,880 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.046*\"vigour\" + 0.045*\"tortur\" + 0.042*\"popolo\" + 0.029*\"regim\" + 0.029*\"cotton\" + 0.029*\"area\" + 0.025*\"citi\" + 0.023*\"multitud\" + 0.020*\"commun\"\n", + "2019-01-31 00:25:55,881 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.009*\"produc\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"spectacl\" + 0.007*\"candid\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:25:55,882 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"sovereignti\" + 0.030*\"rural\" + 0.026*\"reprint\" + 0.024*\"turin\" + 0.023*\"poison\" + 0.023*\"personifi\" + 0.019*\"moscow\" + 0.016*\"unfortun\" + 0.015*\"poland\"\n", + "2019-01-31 00:25:55,884 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.029*\"final\" + 0.022*\"tourist\" + 0.020*\"wife\" + 0.018*\"champion\" + 0.018*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"workplac\"\n", + "2019-01-31 00:25:55,889 : INFO : topic diff=0.010249, rho=0.057735\n", + "2019-01-31 00:25:56,048 : INFO : PROGRESS: pass 0, at document #602000/4922894\n", + "2019-01-31 00:25:57,491 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:25:57,757 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:25:57,758 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"exampl\" + 0.007*\"théori\" + 0.007*\"frontal\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"servitud\" + 
0.006*\"mode\" + 0.006*\"poet\" + 0.006*\"measur\"\n", + "2019-01-31 00:25:57,759 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"deal\" + 0.004*\"like\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:25:57,761 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.010*\"organ\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"human\" + 0.007*\"requir\" + 0.007*\"student\"\n", + "2019-01-31 00:25:57,762 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"taxpay\" + 0.016*\"squatter\" + 0.015*\"candid\" + 0.015*\"tornado\" + 0.013*\"horac\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.012*\"ret\" + 0.011*\"find\"\n", + "2019-01-31 00:25:57,767 : INFO : topic diff=0.010893, rho=0.057639\n", + "2019-01-31 00:25:57,922 : INFO : PROGRESS: pass 0, at document #604000/4922894\n", + "2019-01-31 00:25:59,338 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:25:59,604 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.014*\"swedish\" + 0.012*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"turkish\"\n", + "2019-01-31 00:25:59,605 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:25:59,606 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.010*\"class\" + 0.009*\"coalit\"\n", + "2019-01-31 00:25:59,608 : INFO : topic #30 (0.020): 0.038*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 
0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:25:59,609 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 00:25:59,614 : INFO : topic diff=0.010261, rho=0.057544\n", + "2019-01-31 00:25:59,767 : INFO : PROGRESS: pass 0, at document #606000/4922894\n", + "2019-01-31 00:26:01,180 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:01,449 : INFO : topic #25 (0.020): 0.028*\"ring\" + 0.021*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.008*\"sourc\"\n", + "2019-01-31 00:26:01,450 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"mexican\"\n", + "2019-01-31 00:26:01,451 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.040*\"american\" + 0.029*\"valour\" + 0.021*\"dutch\" + 0.018*\"polit\" + 0.017*\"folei\" + 0.017*\"player\" + 0.016*\"english\" + 0.011*\"wedg\" + 0.010*\"surnam\"\n", + "2019-01-31 00:26:01,452 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"deal\" + 0.004*\"like\" + 0.004*\"help\"\n", + "2019-01-31 00:26:01,454 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"aggress\" + 0.017*\"oper\" + 0.016*\"com\" + 0.012*\"unionist\" + 0.012*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 00:26:01,459 : INFO : topic diff=0.010976, rho=0.057448\n", + "2019-01-31 00:26:01,669 : INFO : PROGRESS: pass 0, at document #608000/4922894\n", + "2019-01-31 00:26:03,076 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 00:26:03,343 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"exampl\" + 0.007*\"southern\" + 0.007*\"théori\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"poet\"\n", + "2019-01-31 00:26:03,344 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.034*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.016*\"physician\" + 0.015*\"place\" + 0.015*\"damn\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"son\"\n", + "2019-01-31 00:26:03,345 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.010*\"organ\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"human\" + 0.007*\"requir\" + 0.007*\"student\"\n", + "2019-01-31 00:26:03,347 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"mexican\"\n", + "2019-01-31 00:26:03,348 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.028*\"germani\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.013*\"der\" + 0.012*\"israel\" + 0.008*\"austria\" + 0.008*\"itali\" + 0.008*\"jeremiah\"\n", + "2019-01-31 00:26:03,354 : INFO : topic diff=0.010731, rho=0.057354\n", + "2019-01-31 00:26:03,508 : INFO : PROGRESS: pass 0, at document #610000/4922894\n", + "2019-01-31 00:26:04,932 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:05,198 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"exampl\" + 0.007*\"southern\" + 0.007*\"théori\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"mode\" + 0.006*\"poet\" + 0.006*\"measur\"\n", + "2019-01-31 00:26:05,199 : INFO : topic #40 (0.020): 0.091*\"unit\" + 0.027*\"collector\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.018*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"governor\" + 
0.012*\"word\" + 0.012*\"degre\"\n", + "2019-01-31 00:26:05,201 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.029*\"germani\" + 0.015*\"berlin\" + 0.014*\"vol\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.012*\"israel\" + 0.009*\"austria\" + 0.008*\"itali\" + 0.007*\"jeremiah\"\n", + "2019-01-31 00:26:05,202 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.057*\"parti\" + 0.027*\"democrat\" + 0.023*\"voluntari\" + 0.021*\"member\" + 0.018*\"polici\" + 0.017*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.014*\"report\"\n", + "2019-01-31 00:26:05,203 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"john\"\n", + "2019-01-31 00:26:05,209 : INFO : topic diff=0.010795, rho=0.057260\n", + "2019-01-31 00:26:05,367 : INFO : PROGRESS: pass 0, at document #612000/4922894\n", + "2019-01-31 00:26:06,829 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:07,095 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.025*\"new\" + 0.023*\"australian\" + 0.023*\"london\" + 0.023*\"england\" + 0.021*\"ireland\" + 0.020*\"british\" + 0.015*\"youth\" + 0.013*\"weekli\"\n", + "2019-01-31 00:26:07,096 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"aggress\" + 0.016*\"com\" + 0.016*\"oper\" + 0.012*\"unionist\" + 0.012*\"militari\" + 0.012*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:26:07,098 : INFO : topic #39 (0.020): 0.032*\"canada\" + 0.028*\"canadian\" + 0.019*\"taxpay\" + 0.018*\"scientist\" + 0.015*\"hoar\" + 0.015*\"basketbal\" + 0.014*\"toronto\" + 0.014*\"confer\" + 0.013*\"ontario\" + 0.011*\"new\"\n", + "2019-01-31 00:26:07,099 : INFO : topic #30 (0.020): 0.038*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 
0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:26:07,100 : INFO : topic #6 (0.020): 0.067*\"fewer\" + 0.026*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:26:07,106 : INFO : topic diff=0.011850, rho=0.057166\n", + "2019-01-31 00:26:07,264 : INFO : PROGRESS: pass 0, at document #614000/4922894\n", + "2019-01-31 00:26:08,709 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:08,975 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.010*\"piec\" + 0.009*\"focal\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:26:08,977 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.045*\"vigour\" + 0.044*\"tortur\" + 0.042*\"popolo\" + 0.030*\"cotton\" + 0.028*\"regim\" + 0.028*\"area\" + 0.024*\"multitud\" + 0.024*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:26:08,978 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"treat\" + 0.006*\"hormon\" + 0.006*\"effect\"\n", + "2019-01-31 00:26:08,979 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.036*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.010*\"coalit\" + 0.010*\"class\"\n", + "2019-01-31 00:26:08,981 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"deal\" + 0.004*\"man\" + 0.004*\"like\" + 0.004*\"end\"\n", + "2019-01-31 00:26:08,987 : INFO : topic diff=0.009898, rho=0.057073\n", + "2019-01-31 00:26:09,139 : INFO : PROGRESS: pass 0, at document #616000/4922894\n", + "2019-01-31 
00:26:10,557 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:10,823 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"uruguayan\" + 0.007*\"like\" + 0.007*\"centuri\" + 0.006*\"dynam\" + 0.006*\"english\"\n", + "2019-01-31 00:26:10,824 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.030*\"unionist\" + 0.030*\"cotton\" + 0.028*\"american\" + 0.023*\"new\" + 0.014*\"terri\" + 0.013*\"california\" + 0.012*\"warrior\" + 0.012*\"north\" + 0.011*\"year\"\n", + "2019-01-31 00:26:10,826 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"tortur\" + 0.042*\"popolo\" + 0.029*\"cotton\" + 0.028*\"area\" + 0.028*\"regim\" + 0.024*\"multitud\" + 0.024*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:26:10,827 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.009*\"disco\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"hormon\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:26:10,829 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.004*\"deal\" + 0.004*\"man\" + 0.004*\"like\" + 0.004*\"end\"\n", + "2019-01-31 00:26:10,834 : INFO : topic diff=0.011246, rho=0.056980\n", + "2019-01-31 00:26:10,992 : INFO : PROGRESS: pass 0, at document #618000/4922894\n", + "2019-01-31 00:26:12,421 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:12,687 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.030*\"sovereignti\" + 0.030*\"rural\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.020*\"turin\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"tyrant\"\n", + "2019-01-31 00:26:12,688 : INFO : topic #46 (0.020): 0.023*\"stop\" + 0.015*\"sweden\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.014*\"treeless\" + 0.014*\"swedish\" + 
0.014*\"norwegian\" + 0.013*\"damag\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 00:26:12,689 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"new\" + 0.023*\"australian\" + 0.023*\"england\" + 0.023*\"london\" + 0.020*\"ireland\" + 0.020*\"british\" + 0.015*\"youth\" + 0.014*\"weekli\"\n", + "2019-01-31 00:26:12,691 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:26:12,692 : INFO : topic #38 (0.020): 0.020*\"walter\" + 0.010*\"king\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.009*\"battalion\" + 0.009*\"teufel\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.008*\"till\" + 0.007*\"armi\"\n", + "2019-01-31 00:26:12,698 : INFO : topic diff=0.009396, rho=0.056888\n", + "2019-01-31 00:26:15,397 : INFO : -11.501 per-word bound, 2897.9 perplexity estimate based on a held-out corpus of 2000 documents with 528109 words\n", + "2019-01-31 00:26:15,398 : INFO : PROGRESS: pass 0, at document #620000/4922894\n", + "2019-01-31 00:26:16,813 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:17,080 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.029*\"incumb\" + 0.015*\"islam\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.011*\"alam\" + 0.009*\"singh\" + 0.009*\"start\"\n", + "2019-01-31 00:26:17,081 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:26:17,082 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"disco\" + 0.007*\"proper\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"have\" + 0.006*\"hormon\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 
00:26:17,083 : INFO : topic #3 (0.020): 0.039*\"present\" + 0.029*\"offic\" + 0.027*\"minist\" + 0.021*\"member\" + 0.020*\"gener\" + 0.019*\"seri\" + 0.017*\"govern\" + 0.016*\"chickasaw\" + 0.016*\"serv\" + 0.015*\"nation\"\n", + "2019-01-31 00:26:17,085 : INFO : topic #38 (0.020): 0.020*\"walter\" + 0.010*\"king\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.009*\"battalion\" + 0.009*\"teufel\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.007*\"till\" + 0.007*\"armi\"\n", + "2019-01-31 00:26:17,091 : INFO : topic diff=0.009777, rho=0.056796\n", + "2019-01-31 00:26:17,245 : INFO : PROGRESS: pass 0, at document #622000/4922894\n", + "2019-01-31 00:26:18,664 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:18,930 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.027*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.018*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"degre\" + 0.012*\"governor\" + 0.012*\"word\"\n", + "2019-01-31 00:26:18,931 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"uruguayan\" + 0.007*\"like\" + 0.007*\"centuri\" + 0.007*\"god\" + 0.006*\"charact\"\n", + "2019-01-31 00:26:18,932 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"depress\" + 0.009*\"briarwood\"\n", + "2019-01-31 00:26:18,934 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"taxpay\" + 0.016*\"ret\" + 0.015*\"candid\" + 0.014*\"tornado\" + 0.013*\"squatter\" + 0.012*\"driver\" + 0.012*\"horac\" + 0.011*\"fool\" + 0.011*\"find\"\n", + "2019-01-31 00:26:18,935 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + 
"2019-01-31 00:26:18,941 : INFO : topic diff=0.008711, rho=0.056705\n", + "2019-01-31 00:26:19,100 : INFO : PROGRESS: pass 0, at document #624000/4922894\n", + "2019-01-31 00:26:20,566 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:20,832 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"bank\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"replac\" + 0.006*\"placement\"\n", + "2019-01-31 00:26:20,833 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.005*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"night\" + 0.004*\"ladi\" + 0.003*\"york\" + 0.003*\"healthcar\"\n", + "2019-01-31 00:26:20,834 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"arsen\" + 0.038*\"line\" + 0.032*\"raid\" + 0.029*\"museo\" + 0.021*\"traceabl\" + 0.017*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:26:20,836 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"daughter\" + 0.011*\"john\"\n", + "2019-01-31 00:26:20,837 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"human\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"student\"\n", + "2019-01-31 00:26:20,843 : INFO : topic diff=0.011849, rho=0.056614\n", + "2019-01-31 00:26:21,001 : INFO : PROGRESS: pass 0, at document #626000/4922894\n", + "2019-01-31 00:26:22,437 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:22,703 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.028*\"incumb\" + 0.015*\"islam\" + 0.012*\"televis\" + 0.011*\"pakistan\" + 0.011*\"alam\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.010*\"start\" + 0.009*\"singh\"\n", + 
"2019-01-31 00:26:22,704 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:26:22,705 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.023*\"adulthood\" + 0.019*\"feel\" + 0.016*\"hostil\" + 0.016*\"male\" + 0.012*\"live\" + 0.011*\"plaisir\" + 0.010*\"yawn\" + 0.009*\"genu\"\n", + "2019-01-31 00:26:22,707 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.020*\"dutch\" + 0.018*\"polit\" + 0.017*\"player\" + 0.016*\"folei\" + 0.016*\"english\" + 0.011*\"netherland\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:26:22,708 : INFO : topic #3 (0.020): 0.039*\"present\" + 0.029*\"offic\" + 0.028*\"minist\" + 0.021*\"member\" + 0.020*\"gener\" + 0.019*\"seri\" + 0.017*\"govern\" + 0.016*\"chickasaw\" + 0.015*\"serv\" + 0.015*\"nation\"\n", + "2019-01-31 00:26:22,713 : INFO : topic diff=0.009073, rho=0.056523\n", + "2019-01-31 00:26:22,871 : INFO : PROGRESS: pass 0, at document #628000/4922894\n", + "2019-01-31 00:26:24,315 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:24,581 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.011*\"aza\" + 0.010*\"king\" + 0.009*\"battalion\" + 0.009*\"teufel\" + 0.009*\"empath\" + 0.008*\"till\" + 0.008*\"centuri\" + 0.008*\"forc\" + 0.007*\"armi\"\n", + "2019-01-31 00:26:24,583 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"aggress\" + 0.016*\"com\" + 0.016*\"oper\" + 0.012*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 00:26:24,584 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.017*\"bishop\" + 0.016*\"retroflex\" + 0.014*\"sail\" + 0.012*\"centuri\" + 
0.009*\"historiographi\" + 0.009*\"italian\" + 0.008*\"poll\"\n", + "2019-01-31 00:26:24,585 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.021*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"santa\" + 0.011*\"josé\"\n", + "2019-01-31 00:26:24,586 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.017*\"champion\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.014*\"martin\" + 0.012*\"open\"\n", + "2019-01-31 00:26:24,592 : INFO : topic diff=0.011036, rho=0.056433\n", + "2019-01-31 00:26:24,748 : INFO : PROGRESS: pass 0, at document #630000/4922894\n", + "2019-01-31 00:26:26,155 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:26,421 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"depress\" + 0.009*\"silicon\"\n", + "2019-01-31 00:26:26,422 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.008*\"mean\" + 0.008*\"uruguayan\" + 0.007*\"centuri\" + 0.007*\"like\" + 0.006*\"god\" + 0.006*\"dynam\"\n", + "2019-01-31 00:26:26,424 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:26:26,425 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.021*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 00:26:26,427 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.067*\"best\" + 0.037*\"yawn\" + 0.033*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 
0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:26:26,432 : INFO : topic diff=0.009004, rho=0.056344\n", + "2019-01-31 00:26:26,588 : INFO : PROGRESS: pass 0, at document #632000/4922894\n", + "2019-01-31 00:26:28,022 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:28,289 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"replac\" + 0.006*\"trace\" + 0.006*\"théori\"\n", + "2019-01-31 00:26:28,290 : INFO : topic #46 (0.020): 0.022*\"stop\" + 0.015*\"norwegian\" + 0.015*\"sweden\" + 0.015*\"norwai\" + 0.014*\"damag\" + 0.014*\"swedish\" + 0.014*\"wind\" + 0.013*\"treeless\" + 0.011*\"farid\" + 0.010*\"danish\"\n", + "2019-01-31 00:26:28,292 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.008*\"land\"\n", + "2019-01-31 00:26:28,293 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.036*\"new\" + 0.023*\"palmer\" + 0.020*\"year\" + 0.017*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:26:28,294 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"depress\" + 0.010*\"briarwood\"\n", + "2019-01-31 00:26:28,300 : INFO : topic diff=0.009596, rho=0.056254\n", + "2019-01-31 00:26:28,454 : INFO : PROGRESS: pass 0, at document #634000/4922894\n", + "2019-01-31 00:26:29,858 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:30,125 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.016*\"champion\" + 0.015*\"taxpay\" + 
0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.012*\"open\"\n", + "2019-01-31 00:26:30,126 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.007*\"southern\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.005*\"mode\" + 0.005*\"differ\"\n", + "2019-01-31 00:26:30,127 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.036*\"new\" + 0.023*\"palmer\" + 0.020*\"year\" + 0.017*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:26:30,128 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.042*\"popolo\" + 0.041*\"tortur\" + 0.029*\"cotton\" + 0.029*\"regim\" + 0.027*\"area\" + 0.026*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:26:30,130 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.037*\"yawn\" + 0.034*\"jacksonvil\" + 0.024*\"japanes\" + 0.020*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:26:30,135 : INFO : topic diff=0.009048, rho=0.056166\n", + "2019-01-31 00:26:30,289 : INFO : PROGRESS: pass 0, at document #636000/4922894\n", + "2019-01-31 00:26:31,715 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:31,981 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.030*\"rural\" + 0.029*\"sovereignti\" + 0.027*\"personifi\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.019*\"moscow\" + 0.017*\"turin\" + 0.017*\"poland\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:26:31,982 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.036*\"publicis\" + 0.023*\"word\" + 0.016*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.011*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:26:31,983 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.042*\"popolo\" + 0.041*\"tortur\" + 0.029*\"regim\" + 0.029*\"cotton\" + 
0.028*\"area\" + 0.026*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:26:31,984 : INFO : topic #6 (0.020): 0.067*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"produc\" + 0.010*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 00:26:31,986 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"taxpay\" + 0.015*\"candid\" + 0.015*\"ret\" + 0.014*\"squatter\" + 0.014*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.012*\"driver\" + 0.010*\"champion\"\n", + "2019-01-31 00:26:31,992 : INFO : topic diff=0.010206, rho=0.056077\n", + "2019-01-31 00:26:32,206 : INFO : PROGRESS: pass 0, at document #638000/4922894\n", + "2019-01-31 00:26:33,661 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:33,926 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.035*\"new\" + 0.022*\"palmer\" + 0.020*\"year\" + 0.017*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:26:33,927 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.036*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.010*\"nativist\" + 0.010*\"coalit\" + 0.009*\"crew\" + 0.009*\"class\"\n", + "2019-01-31 00:26:33,928 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.026*\"new\" + 0.024*\"london\" + 0.024*\"england\" + 0.022*\"australian\" + 0.021*\"ireland\" + 0.021*\"british\" + 0.016*\"youth\" + 0.015*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:26:33,930 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.026*\"cortic\" + 0.020*\"act\" + 0.017*\"start\" + 0.017*\"ricardo\" + 0.014*\"case\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.007*\"justic\"\n", + "2019-01-31 00:26:33,931 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 
0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.010*\"produc\" + 0.010*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 00:26:33,937 : INFO : topic diff=0.010140, rho=0.055989\n", + "2019-01-31 00:26:36,710 : INFO : -11.903 per-word bound, 3828.9 perplexity estimate based on a held-out corpus of 2000 documents with 575834 words\n", + "2019-01-31 00:26:36,710 : INFO : PROGRESS: pass 0, at document #640000/4922894\n", + "2019-01-31 00:26:38,151 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:38,418 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.067*\"best\" + 0.036*\"yawn\" + 0.033*\"jacksonvil\" + 0.026*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:26:38,419 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"produc\" + 0.010*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 00:26:38,420 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.005*\"blue\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.004*\"night\" + 0.004*\"ladi\" + 0.003*\"york\" + 0.003*\"dramatist\"\n", + "2019-01-31 00:26:38,421 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.035*\"new\" + 0.022*\"palmer\" + 0.020*\"year\" + 0.017*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:26:38,422 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.008*\"human\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"student\"\n", + "2019-01-31 00:26:38,428 : INFO : topic diff=0.010132, rho=0.055902\n", + "2019-01-31 00:26:38,587 : INFO : PROGRESS: pass 0, at document #642000/4922894\n", + "2019-01-31 00:26:40,021 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 00:26:40,287 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.008*\"human\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"student\"\n", + "2019-01-31 00:26:40,288 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"produc\" + 0.010*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 00:26:40,289 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.019*\"polici\" + 0.015*\"republ\" + 0.015*\"seaport\" + 0.014*\"bypass\" + 0.014*\"liber\"\n", + "2019-01-31 00:26:40,290 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.010*\"govern\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"bank\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"replac\" + 0.006*\"new\"\n", + "2019-01-31 00:26:40,291 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.027*\"germani\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.013*\"vol\" + 0.013*\"israel\" + 0.012*\"der\" + 0.010*\"austria\" + 0.009*\"hungarian\" + 0.009*\"jeremiah\"\n", + "2019-01-31 00:26:40,297 : INFO : topic diff=0.010181, rho=0.055815\n", + "2019-01-31 00:26:40,456 : INFO : PROGRESS: pass 0, at document #644000/4922894\n", + "2019-01-31 00:26:41,904 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:42,174 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.031*\"rural\" + 0.028*\"sovereignti\" + 0.026*\"personifi\" + 0.026*\"reprint\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.018*\"turin\" + 0.017*\"poland\" + 0.016*\"shirin\"\n", + "2019-01-31 00:26:42,175 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"produc\" + 0.008*\"veget\" + 
0.007*\"encyclopedia\" + 0.007*\"candid\" + 0.007*\"develop\"\n", + "2019-01-31 00:26:42,176 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.022*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.009*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:26:42,178 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.048*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.025*\"korea\" + 0.018*\"leah\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.013*\"kim\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:26:42,179 : INFO : topic #44 (0.020): 0.035*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.017*\"map\" + 0.016*\"champion\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\"\n", + "2019-01-31 00:26:42,184 : INFO : topic diff=0.010861, rho=0.055728\n", + "2019-01-31 00:26:42,337 : INFO : PROGRESS: pass 0, at document #646000/4922894\n", + "2019-01-31 00:26:43,745 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:44,011 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"utopian\" + 0.007*\"cytokin\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"servitud\"\n", + "2019-01-31 00:26:44,013 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"caus\" + 0.007*\"media\" + 0.007*\"proper\" + 0.007*\"acid\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"pathwai\" + 0.006*\"effect\"\n", + "2019-01-31 00:26:44,014 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.016*\"new\" + 0.015*\"edit\" + 0.014*\"presid\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:26:44,015 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.024*\"hous\" + 0.019*\"rivièr\" + 0.016*\"buford\" + 0.013*\"histor\" + 0.011*\"constitut\" + 0.011*\"rosenwald\" + 0.011*\"strategist\" 
+ 0.010*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 00:26:44,016 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.026*\"cortic\" + 0.020*\"ricardo\" + 0.019*\"act\" + 0.017*\"start\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"justic\" + 0.008*\"judaism\"\n", + "2019-01-31 00:26:44,022 : INFO : topic diff=0.009319, rho=0.055641\n", + "2019-01-31 00:26:44,174 : INFO : PROGRESS: pass 0, at document #648000/4922894\n", + "2019-01-31 00:26:45,576 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:45,842 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"produc\" + 0.010*\"movi\" + 0.010*\"direct\"\n", + "2019-01-31 00:26:45,843 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"alic\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.020*\"rainfal\" + 0.017*\"atheist\"\n", + "2019-01-31 00:26:45,844 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.024*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:26:45,846 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.030*\"rural\" + 0.029*\"sovereignti\" + 0.026*\"reprint\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.017*\"turin\" + 0.016*\"shirin\"\n", + "2019-01-31 00:26:45,847 : INFO : topic #20 (0.020): 0.134*\"scholar\" + 0.040*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.019*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.008*\"class\"\n", + "2019-01-31 00:26:45,853 : INFO : topic diff=0.010850, rho=0.055556\n", + "2019-01-31 00:26:46,012 : INFO : PROGRESS: pass 0, at document #650000/4922894\n", + "2019-01-31 00:26:47,458 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:47,723 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.010*\"movi\" + 0.010*\"produc\" + 0.010*\"direct\"\n", + "2019-01-31 00:26:47,724 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.039*\"arsen\" + 0.038*\"line\" + 0.033*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.014*\"artist\" + 0.014*\"exhaust\"\n", + "2019-01-31 00:26:47,726 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.047*\"chilton\" + 0.027*\"kong\" + 0.027*\"hong\" + 0.025*\"korea\" + 0.018*\"leah\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.014*\"kim\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:26:47,727 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"develop\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"human\" + 0.008*\"peopl\" + 0.007*\"requir\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:26:47,728 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.013*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:26:47,734 : INFO : topic diff=0.009731, rho=0.055470\n", + "2019-01-31 00:26:47,893 : INFO : PROGRESS: pass 0, at document #652000/4922894\n", + "2019-01-31 00:26:49,337 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:49,603 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.022*\"theater\" + 0.020*\"compos\" + 0.017*\"place\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.014*\"physician\" + 0.012*\"olympo\" + 0.011*\"son\"\n", + "2019-01-31 00:26:49,604 : INFO : topic #46 (0.020): 0.023*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"treeless\" + 0.015*\"wind\" + 
0.015*\"norwegian\" + 0.015*\"swedish\" + 0.013*\"damag\" + 0.012*\"farid\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:26:49,606 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.007*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"deal\" + 0.004*\"like\" + 0.004*\"help\"\n", + "2019-01-31 00:26:49,607 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.029*\"incumb\" + 0.015*\"televis\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"start\" + 0.010*\"sri\" + 0.010*\"alam\"\n", + "2019-01-31 00:26:49,608 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.024*\"adulthood\" + 0.018*\"feel\" + 0.016*\"male\" + 0.015*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.009*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:26:49,614 : INFO : topic diff=0.010291, rho=0.055385\n", + "2019-01-31 00:26:49,767 : INFO : PROGRESS: pass 0, at document #654000/4922894\n", + "2019-01-31 00:26:51,150 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:51,416 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.029*\"incumb\" + 0.014*\"televis\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.011*\"muskoge\" + 0.011*\"sri\" + 0.010*\"khalsa\" + 0.010*\"start\" + 0.010*\"alam\"\n", + "2019-01-31 00:26:51,417 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.016*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"produc\" + 0.007*\"veget\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"develop\"\n", + "2019-01-31 00:26:51,418 : INFO : topic #27 (0.020): 0.065*\"questionnair\" + 0.019*\"taxpay\" + 0.015*\"ret\" + 0.015*\"candid\" + 0.014*\"tornado\" + 0.013*\"squatter\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"champion\"\n", + "2019-01-31 00:26:51,419 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.047*\"vigour\" + 0.043*\"tortur\" + 0.042*\"popolo\" + 0.029*\"cotton\" + 
0.027*\"regim\" + 0.027*\"area\" + 0.025*\"multitud\" + 0.023*\"citi\" + 0.019*\"prosper\"\n", + "2019-01-31 00:26:51,421 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.034*\"new\" + 0.022*\"palmer\" + 0.019*\"year\" + 0.016*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:26:51,426 : INFO : topic diff=0.009358, rho=0.055300\n", + "2019-01-31 00:26:51,586 : INFO : PROGRESS: pass 0, at document #656000/4922894\n", + "2019-01-31 00:26:53,025 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:53,291 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.071*\"juli\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.068*\"august\" + 0.067*\"april\" + 0.066*\"decatur\" + 0.065*\"judici\"\n", + "2019-01-31 00:26:53,292 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.037*\"line\" + 0.037*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.015*\"pain\" + 0.014*\"artist\" + 0.013*\"exhaust\"\n", + "2019-01-31 00:26:53,293 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.037*\"yawn\" + 0.032*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.020*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:26:53,294 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.034*\"new\" + 0.022*\"palmer\" + 0.019*\"year\" + 0.016*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:26:53,295 : INFO : topic #36 (0.020): 0.019*\"companhia\" + 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"develop\" + 0.009*\"pop\" + 0.009*\"serv\" + 0.008*\"includ\" + 0.008*\"oper\" + 0.007*\"user\" + 0.007*\"base\"\n", + "2019-01-31 00:26:53,301 : INFO : topic diff=0.010270, rho=0.055216\n", + "2019-01-31 00:26:53,460 : INFO : PROGRESS: pass 0, at document #658000/4922894\n", + "2019-01-31 
00:26:54,879 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:55,145 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.010*\"simpler\"\n", + "2019-01-31 00:26:55,147 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.014*\"televis\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.011*\"sri\" + 0.010*\"khalsa\" + 0.010*\"start\" + 0.010*\"alam\"\n", + "2019-01-31 00:26:55,148 : INFO : topic #36 (0.020): 0.019*\"companhia\" + 0.011*\"network\" + 0.010*\"develop\" + 0.009*\"prognosi\" + 0.009*\"pop\" + 0.008*\"serv\" + 0.008*\"includ\" + 0.008*\"oper\" + 0.007*\"base\" + 0.007*\"user\"\n", + "2019-01-31 00:26:55,149 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"oper\" + 0.016*\"com\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:26:55,150 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.031*\"canadian\" + 0.019*\"scientist\" + 0.018*\"taxpay\" + 0.017*\"hoar\" + 0.017*\"toronto\" + 0.016*\"basketbal\" + 0.014*\"confer\" + 0.014*\"ontario\" + 0.011*\"new\"\n", + "2019-01-31 00:26:55,156 : INFO : topic diff=0.010948, rho=0.055132\n", + "2019-01-31 00:26:57,954 : INFO : -11.596 per-word bound, 3096.3 perplexity estimate based on a held-out corpus of 2000 documents with 573499 words\n", + "2019-01-31 00:26:57,955 : INFO : PROGRESS: pass 0, at document #660000/4922894\n", + "2019-01-31 00:26:59,409 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:26:59,675 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"televis\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.011*\"start\" + 0.010*\"sri\" + 0.010*\"alam\"\n", + 
"2019-01-31 00:26:59,676 : INFO : topic #48 (0.020): 0.078*\"march\" + 0.076*\"sens\" + 0.075*\"octob\" + 0.070*\"juli\" + 0.069*\"januari\" + 0.069*\"august\" + 0.067*\"notion\" + 0.065*\"decatur\" + 0.065*\"april\" + 0.064*\"judici\"\n", + "2019-01-31 00:26:59,677 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.007*\"man\" + 0.005*\"blue\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"litig\" + 0.004*\"admit\" + 0.003*\"ladi\" + 0.003*\"dramatist\"\n", + "2019-01-31 00:26:59,679 : INFO : topic #20 (0.020): 0.131*\"scholar\" + 0.039*\"struggl\" + 0.030*\"high\" + 0.029*\"educ\" + 0.019*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"task\" + 0.008*\"class\"\n", + "2019-01-31 00:26:59,680 : INFO : topic #29 (0.020): 0.010*\"govern\" + 0.010*\"start\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"bank\" + 0.006*\"trace\" + 0.006*\"replac\" + 0.006*\"companhia\"\n", + "2019-01-31 00:26:59,686 : INFO : topic diff=0.010013, rho=0.055048\n", + "2019-01-31 00:26:59,840 : INFO : PROGRESS: pass 0, at document #662000/4922894\n", + "2019-01-31 00:27:01,251 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:01,517 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.024*\"cortic\" + 0.019*\"ricardo\" + 0.018*\"act\" + 0.017*\"start\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"justic\" + 0.007*\"judaism\"\n", + "2019-01-31 00:27:01,518 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.022*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:27:01,519 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"centuri\" + 0.007*\"like\" + 0.007*\"god\" + 0.007*\"english\"\n", + "2019-01-31 
00:27:01,521 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.014*\"mount\" + 0.011*\"foam\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.008*\"lobe\"\n", + "2019-01-31 00:27:01,521 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.038*\"line\" + 0.037*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.015*\"pain\" + 0.013*\"artist\" + 0.013*\"exhaust\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:27:01,527 : INFO : topic diff=0.009242, rho=0.054965\n", + "2019-01-31 00:27:01,689 : INFO : PROGRESS: pass 0, at document #664000/4922894\n", + "2019-01-31 00:27:03,160 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:03,430 : INFO : topic #4 (0.020): 0.025*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.008*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"develop\"\n", + "2019-01-31 00:27:03,431 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.067*\"best\" + 0.036*\"yawn\" + 0.032*\"jacksonvil\" + 0.024*\"japanes\" + 0.020*\"noll\" + 0.020*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:27:03,432 : INFO : topic #48 (0.020): 0.077*\"march\" + 0.076*\"sens\" + 0.075*\"octob\" + 0.068*\"juli\" + 0.068*\"januari\" + 0.067*\"august\" + 0.066*\"notion\" + 0.066*\"decatur\" + 0.064*\"april\" + 0.063*\"judici\"\n", + "2019-01-31 00:27:03,434 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:27:03,435 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.017*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 
0.013*\"map\" + 0.013*\"martin\"\n", + "2019-01-31 00:27:03,440 : INFO : topic diff=0.011357, rho=0.054882\n", + "2019-01-31 00:27:03,597 : INFO : PROGRESS: pass 0, at document #666000/4922894\n", + "2019-01-31 00:27:05,022 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:05,288 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.029*\"germani\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"vol\" + 0.013*\"der\" + 0.012*\"israel\" + 0.008*\"austria\" + 0.008*\"jeremiah\" + 0.008*\"hungarian\"\n", + "2019-01-31 00:27:05,289 : INFO : topic #29 (0.020): 0.010*\"govern\" + 0.010*\"start\" + 0.009*\"million\" + 0.008*\"yawn\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"bank\" + 0.006*\"trace\" + 0.006*\"companhia\" + 0.006*\"replac\"\n", + "2019-01-31 00:27:05,290 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.031*\"sovereignti\" + 0.030*\"rural\" + 0.028*\"reprint\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.019*\"poland\" + 0.018*\"moscow\" + 0.015*\"czech\" + 0.015*\"turin\"\n", + "2019-01-31 00:27:05,291 : INFO : topic #43 (0.020): 0.061*\"elect\" + 0.055*\"parti\" + 0.026*\"democrat\" + 0.024*\"voluntari\" + 0.023*\"republ\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"liber\" + 0.014*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 00:27:05,292 : INFO : topic #39 (0.020): 0.038*\"canada\" + 0.031*\"canadian\" + 0.019*\"scientist\" + 0.018*\"taxpay\" + 0.017*\"hoar\" + 0.017*\"toronto\" + 0.015*\"basketbal\" + 0.014*\"ontario\" + 0.013*\"confer\" + 0.011*\"new\"\n", + "2019-01-31 00:27:05,298 : INFO : topic diff=0.009918, rho=0.054800\n", + "2019-01-31 00:27:05,454 : INFO : PROGRESS: pass 0, at document #668000/4922894\n", + "2019-01-31 00:27:06,887 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:07,153 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.013*\"televis\" + 0.012*\"muskoge\" + 
0.011*\"start\" + 0.011*\"khalsa\" + 0.011*\"alam\" + 0.010*\"sri\"\n", + "2019-01-31 00:27:07,155 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"john\"\n", + "2019-01-31 00:27:07,156 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.014*\"mount\" + 0.011*\"foam\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.008*\"lobe\"\n", + "2019-01-31 00:27:07,157 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"rel\" + 0.028*\"son\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:27:07,158 : INFO : topic #4 (0.020): 0.024*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.008*\"encyclopedia\" + 0.008*\"produc\" + 0.008*\"candid\" + 0.007*\"develop\"\n", + "2019-01-31 00:27:07,164 : INFO : topic diff=0.009477, rho=0.054718\n", + "2019-01-31 00:27:07,373 : INFO : PROGRESS: pass 0, at document #670000/4922894\n", + "2019-01-31 00:27:08,800 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:09,067 : INFO : topic #46 (0.020): 0.022*\"stop\" + 0.017*\"sweden\" + 0.015*\"wind\" + 0.015*\"treeless\" + 0.015*\"norwai\" + 0.015*\"damag\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.012*\"huntsvil\" + 0.012*\"iceland\"\n", + "2019-01-31 00:27:09,068 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:27:09,069 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.034*\"cleveland\" + 0.030*\"place\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 
0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:27:09,071 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.043*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"focal\"\n", + "2019-01-31 00:27:09,072 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"human\" + 0.008*\"peopl\" + 0.007*\"student\"\n", + "2019-01-31 00:27:09,078 : INFO : topic diff=0.009115, rho=0.054636\n", + "2019-01-31 00:27:09,235 : INFO : PROGRESS: pass 0, at document #672000/4922894\n", + "2019-01-31 00:27:10,652 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:10,921 : INFO : topic #39 (0.020): 0.037*\"canada\" + 0.031*\"canadian\" + 0.018*\"scientist\" + 0.018*\"taxpay\" + 0.016*\"hoar\" + 0.016*\"toronto\" + 0.015*\"basketbal\" + 0.014*\"ontario\" + 0.013*\"confer\" + 0.011*\"new\"\n", + "2019-01-31 00:27:10,922 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.016*\"com\" + 0.015*\"oper\" + 0.012*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:27:10,923 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.034*\"perceptu\" + 0.021*\"theater\" + 0.020*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:27:10,924 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.013*\"televis\" + 0.011*\"muskoge\" + 0.011*\"alam\" + 0.011*\"start\" + 0.011*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 00:27:10,926 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 
0.011*\"daughter\" + 0.011*\"john\"\n", + "2019-01-31 00:27:10,932 : INFO : topic diff=0.010958, rho=0.054554\n", + "2019-01-31 00:27:11,089 : INFO : PROGRESS: pass 0, at document #674000/4922894\n", + "2019-01-31 00:27:12,528 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:12,795 : INFO : topic #27 (0.020): 0.066*\"questionnair\" + 0.020*\"taxpay\" + 0.016*\"ret\" + 0.016*\"candid\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"squatter\" + 0.011*\"tornado\" + 0.011*\"find\" + 0.011*\"champion\"\n", + "2019-01-31 00:27:12,796 : INFO : topic #17 (0.020): 0.070*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.011*\"centuri\" + 0.009*\"relationship\" + 0.009*\"italian\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:27:12,797 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.016*\"com\" + 0.015*\"oper\" + 0.012*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:27:12,798 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.013*\"televis\" + 0.011*\"alam\" + 0.011*\"muskoge\" + 0.010*\"start\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 00:27:12,799 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.028*\"germani\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"vol\" + 0.012*\"der\" + 0.012*\"israel\" + 0.008*\"greek\" + 0.008*\"austria\" + 0.008*\"jeremiah\"\n", + "2019-01-31 00:27:12,805 : INFO : topic diff=0.009570, rho=0.054473\n", + "2019-01-31 00:27:12,965 : INFO : PROGRESS: pass 0, at document #676000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:27:14,422 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:14,688 : INFO : topic #17 (0.020): 0.070*\"church\" + 0.021*\"cathol\" + 
0.021*\"christian\" + 0.019*\"bishop\" + 0.014*\"sail\" + 0.014*\"retroflex\" + 0.011*\"centuri\" + 0.009*\"relationship\" + 0.009*\"italian\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:27:14,689 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.010*\"form\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"centuri\" + 0.007*\"like\" + 0.007*\"god\" + 0.006*\"english\"\n", + "2019-01-31 00:27:14,691 : INFO : topic #46 (0.020): 0.021*\"stop\" + 0.018*\"sweden\" + 0.015*\"wind\" + 0.015*\"damag\" + 0.015*\"swedish\" + 0.015*\"norwai\" + 0.014*\"treeless\" + 0.014*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"iceland\"\n", + "2019-01-31 00:27:14,692 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.007*\"disco\" + 0.007*\"have\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.006*\"acid\" + 0.006*\"hormon\" + 0.006*\"treat\"\n", + "2019-01-31 00:27:14,693 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.016*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:27:14,699 : INFO : topic diff=0.009393, rho=0.054393\n", + "2019-01-31 00:27:14,853 : INFO : PROGRESS: pass 0, at document #678000/4922894\n", + "2019-01-31 00:27:16,271 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:16,537 : INFO : topic #27 (0.020): 0.066*\"questionnair\" + 0.020*\"taxpay\" + 0.016*\"candid\" + 0.015*\"ret\" + 0.014*\"fool\" + 0.013*\"driver\" + 0.011*\"champion\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.011*\"tornado\"\n", + "2019-01-31 00:27:16,538 : INFO : topic #45 (0.020): 0.017*\"black\" + 0.016*\"western\" + 0.012*\"colder\" + 0.012*\"jpg\" + 0.011*\"fifteenth\" + 0.011*\"record\" + 0.011*\"illicit\" + 0.009*\"blind\" + 0.008*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:27:16,539 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 
0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:27:16,540 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.043*\"tortur\" + 0.042*\"popolo\" + 0.029*\"area\" + 0.028*\"cotton\" + 0.025*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.019*\"prosper\"\n", + "2019-01-31 00:27:16,541 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.039*\"line\" + 0.039*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.016*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:27:16,547 : INFO : topic diff=0.009438, rho=0.054313\n", + "2019-01-31 00:27:19,314 : INFO : -11.820 per-word bound, 3616.0 perplexity estimate based on a held-out corpus of 2000 documents with 570372 words\n", + "2019-01-31 00:27:19,315 : INFO : PROGRESS: pass 0, at document #680000/4922894\n", + "2019-01-31 00:27:20,756 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:21,023 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.029*\"pari\" + 0.024*\"jean\" + 0.022*\"sail\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"focal\"\n", + "2019-01-31 00:27:21,024 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.023*\"scientist\" + 0.023*\"player\" + 0.020*\"taxpay\" + 0.019*\"place\" + 0.012*\"clot\" + 0.012*\"folei\" + 0.012*\"leagu\" + 0.010*\"ruler\" + 0.010*\"reconstruct\"\n", + "2019-01-31 00:27:21,024 : INFO : topic #26 (0.020): 0.030*\"champion\" + 0.030*\"workplac\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.019*\"rainfal\" + 0.018*\"nation\" + 0.018*\"alic\"\n", + "2019-01-31 00:27:21,026 : INFO : topic #20 (0.020): 0.135*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.017*\"yawn\" + 
0.014*\"prognosi\" + 0.009*\"task\" + 0.008*\"gothic\" + 0.008*\"class\"\n", + "2019-01-31 00:27:21,027 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:27:21,032 : INFO : topic diff=0.008632, rho=0.054233\n", + "2019-01-31 00:27:21,190 : INFO : PROGRESS: pass 0, at document #682000/4922894\n", + "2019-01-31 00:27:22,620 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:22,886 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.034*\"new\" + 0.022*\"palmer\" + 0.018*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"dai\"\n", + "2019-01-31 00:27:22,887 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.018*\"sweden\" + 0.018*\"norwai\" + 0.016*\"norwegian\" + 0.015*\"swedish\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.013*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"iceland\"\n", + "2019-01-31 00:27:22,888 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.040*\"line\" + 0.039*\"arsen\" + 0.034*\"raid\" + 0.029*\"museo\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.016*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:27:22,889 : INFO : topic #49 (0.020): 0.046*\"india\" + 0.030*\"incumb\" + 0.015*\"islam\" + 0.013*\"pakistan\" + 0.013*\"televis\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.011*\"alam\" + 0.010*\"start\" + 0.010*\"anglo\"\n", + "2019-01-31 00:27:22,890 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:27:22,896 : INFO : topic diff=0.009671, rho=0.054153\n", + "2019-01-31 00:27:23,063 : INFO : PROGRESS: pass 0, at document #684000/4922894\n", + "2019-01-31 
00:27:24,525 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:24,791 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.034*\"sovereignti\" + 0.031*\"rural\" + 0.026*\"reprint\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.014*\"malaysia\" + 0.014*\"czech\"\n", + "2019-01-31 00:27:24,792 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.030*\"incumb\" + 0.015*\"islam\" + 0.013*\"televis\" + 0.013*\"pakistan\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.011*\"alam\" + 0.010*\"start\" + 0.010*\"anglo\"\n", + "2019-01-31 00:27:24,793 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.005*\"bewild\" + 0.005*\"blue\" + 0.005*\"night\" + 0.004*\"litig\" + 0.004*\"vision\" + 0.003*\"introductori\" + 0.003*\"admit\"\n", + "2019-01-31 00:27:24,794 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:27:24,795 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.018*\"irish\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"produc\" + 0.008*\"veget\" + 0.008*\"encyclopedia\" + 0.007*\"candid\"\n", + "2019-01-31 00:27:24,801 : INFO : topic diff=0.012123, rho=0.054074\n", + "2019-01-31 00:27:24,957 : INFO : PROGRESS: pass 0, at document #686000/4922894\n", + "2019-01-31 00:27:26,372 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:26,638 : INFO : topic #36 (0.020): 0.019*\"companhia\" + 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"serv\" + 0.009*\"develop\" + 0.009*\"manag\" + 0.009*\"pop\" + 0.008*\"softwar\" + 0.008*\"techniqu\" + 0.008*\"inform\"\n", + "2019-01-31 00:27:26,639 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.025*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 
0.016*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.008*\"justic\" + 0.008*\"judaism\"\n", + "2019-01-31 00:27:26,640 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"deal\" + 0.004*\"like\" + 0.004*\"help\"\n", + "2019-01-31 00:27:26,641 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.025*\"collector\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.019*\"requir\" + 0.017*\"professor\" + 0.017*\"student\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:27:26,642 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.044*\"tortur\" + 0.042*\"popolo\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.025*\"regim\" + 0.025*\"multitud\" + 0.022*\"citi\" + 0.019*\"prosper\"\n", + "2019-01-31 00:27:26,648 : INFO : topic diff=0.007781, rho=0.053995\n", + "2019-01-31 00:27:26,802 : INFO : PROGRESS: pass 0, at document #688000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:27:28,220 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:28,486 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"king\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"centuri\" + 0.007*\"till\"\n", + "2019-01-31 00:27:28,487 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:27:28,488 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:27:28,489 : INFO : topic #24 (0.020): 0.039*\"book\" + 
0.034*\"publicis\" + 0.024*\"word\" + 0.016*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:27:28,490 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.017*\"irish\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.009*\"candid\" + 0.008*\"produc\" + 0.008*\"veget\" + 0.008*\"encyclopedia\"\n", + "2019-01-31 00:27:28,496 : INFO : topic diff=0.009390, rho=0.053916\n", + "2019-01-31 00:27:28,653 : INFO : PROGRESS: pass 0, at document #690000/4922894\n", + "2019-01-31 00:27:30,065 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:30,332 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.020*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:27:30,333 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.018*\"norwai\" + 0.017*\"sweden\" + 0.017*\"damag\" + 0.016*\"norwegian\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"danish\"\n", + "2019-01-31 00:27:30,334 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.034*\"new\" + 0.023*\"palmer\" + 0.018*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 00:27:30,335 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"rel\" + 0.028*\"son\" + 0.025*\"reconstruct\" + 0.023*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:27:30,336 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.036*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"class\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"hawaii\"\n", + "2019-01-31 00:27:30,342 : INFO : topic diff=0.010920, rho=0.053838\n", + 
"2019-01-31 00:27:30,499 : INFO : PROGRESS: pass 0, at document #692000/4922894\n", + "2019-01-31 00:27:31,907 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:32,176 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.040*\"line\" + 0.040*\"arsen\" + 0.033*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.017*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:27:32,177 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.066*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:27:32,178 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.006*\"proper\" + 0.006*\"acid\" + 0.006*\"effect\"\n", + "2019-01-31 00:27:32,179 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.031*\"canadian\" + 0.018*\"scientist\" + 0.018*\"hoar\" + 0.017*\"taxpay\" + 0.015*\"toronto\" + 0.015*\"basketbal\" + 0.013*\"ontario\" + 0.012*\"confer\" + 0.011*\"hydrogen\"\n", + "2019-01-31 00:27:32,180 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"king\" + 0.010*\"teufel\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"till\" + 0.008*\"empath\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"centuri\"\n", + "2019-01-31 00:27:32,186 : INFO : topic diff=0.009530, rho=0.053760\n", + "2019-01-31 00:27:32,342 : INFO : PROGRESS: pass 0, at document #694000/4922894\n", + "2019-01-31 00:27:33,784 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:34,050 : INFO : topic #31 (0.020): 0.064*\"fusiform\" + 0.024*\"scientist\" + 0.023*\"player\" + 0.020*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.012*\"folei\" + 0.010*\"ruler\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:27:34,051 : INFO : topic #14 (0.020): 
0.024*\"forc\" + 0.022*\"aggress\" + 0.019*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.009*\"refut\"\n", + "2019-01-31 00:27:34,052 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"irish\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.009*\"candid\" + 0.008*\"produc\" + 0.008*\"veget\" + 0.008*\"encyclopedia\"\n", + "2019-01-31 00:27:34,054 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.038*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.017*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.008*\"district\"\n", + "2019-01-31 00:27:34,054 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.026*\"new\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.024*\"australian\" + 0.022*\"england\" + 0.021*\"british\" + 0.020*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:27:34,060 : INFO : topic diff=0.010401, rho=0.053683\n", + "2019-01-31 00:27:34,216 : INFO : PROGRESS: pass 0, at document #696000/4922894\n", + "2019-01-31 00:27:35,651 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:35,917 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.019*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.010*\"foam\" + 0.008*\"palmer\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 00:27:35,918 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"rel\" + 0.028*\"son\" + 0.026*\"reconstruct\" + 0.023*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:27:35,919 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.026*\"factor\" + 0.022*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:27:35,920 : INFO : topic #2 (0.020): 
0.048*\"isl\" + 0.036*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"class\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"crew\"\n", + "2019-01-31 00:27:35,921 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.033*\"unionist\" + 0.030*\"cotton\" + 0.029*\"american\" + 0.022*\"new\" + 0.015*\"terri\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.012*\"north\" + 0.011*\"year\"\n", + "2019-01-31 00:27:35,927 : INFO : topic diff=0.008782, rho=0.053606\n", + "2019-01-31 00:27:36,089 : INFO : PROGRESS: pass 0, at document #698000/4922894\n", + "2019-01-31 00:27:37,554 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:37,820 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.051*\"chilton\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.012*\"kim\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:27:37,822 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"cytokin\" + 0.006*\"utopian\" + 0.006*\"southern\"\n", + "2019-01-31 00:27:37,823 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.033*\"unionist\" + 0.029*\"cotton\" + 0.028*\"american\" + 0.022*\"new\" + 0.015*\"terri\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.012*\"north\" + 0.012*\"year\"\n", + "2019-01-31 00:27:37,824 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.005*\"bewild\" + 0.005*\"blue\" + 0.004*\"night\" + 0.004*\"litig\" + 0.003*\"vision\" + 0.003*\"ladi\" + 0.003*\"wither\"\n", + "2019-01-31 00:27:37,825 : INFO : topic #46 (0.020): 0.022*\"stop\" + 0.017*\"norwai\" + 0.017*\"sweden\" + 0.016*\"damag\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.013*\"treeless\" + 0.013*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:27:37,831 : INFO : topic diff=0.011073, rho=0.053529\n", + 
"2019-01-31 00:27:40,487 : INFO : -11.839 per-word bound, 3664.7 perplexity estimate based on a held-out corpus of 2000 documents with 519573 words\n", + "2019-01-31 00:27:40,487 : INFO : PROGRESS: pass 0, at document #700000/4922894\n", + "2019-01-31 00:27:41,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:27:42,144 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.019*\"warmth\" + 0.017*\"area\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.010*\"foam\" + 0.008*\"palmer\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.007*\"vacant\"\n", + "2019-01-31 00:27:42,145 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"deal\" + 0.004*\"like\" + 0.004*\"help\"\n", + "2019-01-31 00:27:42,146 : INFO : topic #46 (0.020): 0.021*\"stop\" + 0.020*\"sweden\" + 0.019*\"norwai\" + 0.017*\"damag\" + 0.015*\"swedish\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.013*\"treeless\" + 0.012*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:27:42,147 : INFO : topic #6 (0.020): 0.067*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.015*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:27:42,149 : INFO : topic #30 (0.020): 0.034*\"cleveland\" + 0.034*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:27:42,155 : INFO : topic diff=0.009249, rho=0.053452\n", + "2019-01-31 00:27:42,362 : INFO : PROGRESS: pass 0, at document #702000/4922894\n", + "2019-01-31 00:27:43,791 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:44,058 : INFO : topic #19 (0.020): 0.015*\"languag\" + 
0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"centuri\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"english\" + 0.006*\"charact\"\n", + "2019-01-31 00:27:44,060 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.011*\"aza\" + 0.010*\"king\" + 0.010*\"teufel\" + 0.010*\"battalion\" + 0.009*\"till\" + 0.008*\"empath\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"centuri\"\n", + "2019-01-31 00:27:44,061 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.015*\"orchestr\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:27:44,062 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.018*\"ricardo\" + 0.017*\"act\" + 0.013*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"justic\" + 0.008*\"judaism\"\n", + "2019-01-31 00:27:44,063 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"john\" + 0.011*\"daughter\"\n", + "2019-01-31 00:27:44,069 : INFO : topic diff=0.008232, rho=0.053376\n", + "2019-01-31 00:27:44,235 : INFO : PROGRESS: pass 0, at document #704000/4922894\n", + "2019-01-31 00:27:45,714 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:45,980 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.016*\"fifteenth\" + 0.015*\"western\" + 0.013*\"jpg\" + 0.013*\"colder\" + 0.012*\"record\" + 0.011*\"illicit\" + 0.010*\"blind\" + 0.009*\"arm\" + 0.008*\"green\"\n", + "2019-01-31 00:27:45,981 : INFO : topic #26 (0.020): 0.030*\"champion\" + 0.030*\"woman\" + 0.030*\"workplac\" + 0.028*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.021*\"event\" + 0.020*\"alic\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:27:45,982 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 
0.020*\"rivièr\" + 0.016*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.009*\"rosenwald\" + 0.009*\"depress\"\n", + "2019-01-31 00:27:45,983 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"centuri\" + 0.007*\"like\" + 0.007*\"english\" + 0.006*\"charact\"\n", + "2019-01-31 00:27:45,984 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.010*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.007*\"countri\" + 0.007*\"bank\" + 0.007*\"companhia\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"inconclus\"\n", + "2019-01-31 00:27:45,990 : INFO : topic diff=0.010897, rho=0.053300\n", + "2019-01-31 00:27:46,146 : INFO : PROGRESS: pass 0, at document #706000/4922894\n", + "2019-01-31 00:27:47,567 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:47,833 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.011*\"woodcut\" + 0.010*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"centuri\" + 0.007*\"like\" + 0.006*\"english\" + 0.006*\"charact\"\n", + "2019-01-31 00:27:47,834 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.027*\"voluntari\" + 0.025*\"democrat\" + 0.020*\"member\" + 0.019*\"republ\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.014*\"seaport\"\n", + "2019-01-31 00:27:47,835 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"cytokin\" + 0.006*\"method\" + 0.006*\"utopian\"\n", + "2019-01-31 00:27:47,837 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:27:47,838 : INFO : topic #17 (0.020): 
0.070*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.018*\"bishop\" + 0.014*\"sail\" + 0.014*\"retroflex\" + 0.011*\"centuri\" + 0.010*\"relationship\" + 0.009*\"italian\" + 0.008*\"historiographi\"\n", + "2019-01-31 00:27:47,844 : INFO : topic diff=0.009473, rho=0.053225\n", + "2019-01-31 00:27:47,996 : INFO : PROGRESS: pass 0, at document #708000/4922894\n", + "2019-01-31 00:27:49,416 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:49,682 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.033*\"sovereignti\" + 0.030*\"rural\" + 0.024*\"reprint\" + 0.024*\"personifi\" + 0.023*\"poison\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"malaysia\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:27:49,683 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.024*\"collector\" + 0.022*\"institut\" + 0.022*\"schuster\" + 0.019*\"requir\" + 0.017*\"student\" + 0.017*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 00:27:49,685 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"john\" + 0.011*\"daughter\"\n", + "2019-01-31 00:27:49,686 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.036*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"class\" + 0.010*\"nativist\" + 0.009*\"crew\"\n", + "2019-01-31 00:27:49,687 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.010*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.007*\"bank\" + 0.007*\"companhia\" + 0.007*\"countri\" + 0.006*\"function\" + 0.006*\"trace\" + 0.006*\"inconclus\"\n", + "2019-01-31 00:27:49,693 : INFO : topic diff=0.009469, rho=0.053149\n", + "2019-01-31 00:27:49,851 : INFO : PROGRESS: pass 0, at document #710000/4922894\n", + "2019-01-31 00:27:51,286 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:27:51,552 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.030*\"canadian\" + 0.016*\"scientist\" + 0.016*\"toronto\" + 0.016*\"ontario\" + 0.015*\"taxpay\" + 0.015*\"hoar\" + 0.013*\"basketbal\" + 0.013*\"hydrogen\" + 0.012*\"confer\"\n", + "2019-01-31 00:27:51,553 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.025*\"collector\" + 0.022*\"institut\" + 0.022*\"schuster\" + 0.019*\"requir\" + 0.017*\"student\" + 0.017*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 00:27:51,554 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.033*\"sovereignti\" + 0.030*\"rural\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"malaysia\" + 0.014*\"turin\"\n", + "2019-01-31 00:27:51,555 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.050*\"chilton\" + 0.028*\"hong\" + 0.028*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:27:51,556 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.027*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.018*\"republ\" + 0.018*\"polici\" + 0.015*\"bypass\" + 0.014*\"liber\" + 0.013*\"seaport\"\n", + "2019-01-31 00:27:51,562 : INFO : topic diff=0.010727, rho=0.053074\n", + "2019-01-31 00:27:51,720 : INFO : PROGRESS: pass 0, at document #712000/4922894\n", + "2019-01-31 00:27:53,120 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:53,389 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.033*\"new\" + 0.024*\"palmer\" + 0.017*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:27:53,390 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.010*\"organ\" + 0.010*\"word\" + 0.010*\"commun\" + 0.009*\"cultur\" + 
0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"socialist\"\n", + "2019-01-31 00:27:53,391 : INFO : topic #20 (0.020): 0.134*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.008*\"campbel\"\n", + "2019-01-31 00:27:53,392 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.010*\"irish\" + 0.009*\"elabor\" + 0.009*\"candid\" + 0.008*\"produc\" + 0.008*\"veget\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:27:53,393 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"candid\" + 0.016*\"ret\" + 0.013*\"fool\" + 0.012*\"find\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.011*\"champion\" + 0.010*\"horac\"\n", + "2019-01-31 00:27:53,399 : INFO : topic diff=0.009532, rho=0.053000\n", + "2019-01-31 00:27:53,557 : INFO : PROGRESS: pass 0, at document #714000/4922894\n", + "2019-01-31 00:27:54,989 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:55,255 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"rhyme\" + 0.009*\"slur\" + 0.008*\"paul\"\n", + "2019-01-31 00:27:55,256 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.026*\"factor\" + 0.022*\"adulthood\" + 0.018*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:27:55,257 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.027*\"minist\" + 0.020*\"member\" + 0.020*\"gener\" + 0.019*\"seri\" + 0.017*\"govern\" + 0.016*\"nation\" + 0.015*\"chickasaw\" + 0.015*\"appeas\"\n", + "2019-01-31 00:27:55,258 : INFO : topic #0 (0.020): 0.072*\"statewid\" + 0.039*\"arsen\" + 0.037*\"line\" + 0.032*\"raid\" + 0.030*\"museo\" + 0.021*\"traceabl\" + 
0.019*\"serv\" + 0.016*\"pain\" + 0.014*\"artist\" + 0.014*\"exhaust\"\n", + "2019-01-31 00:27:55,259 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.012*\"der\" + 0.012*\"israel\" + 0.008*\"austria\" + 0.008*\"hungarian\" + 0.008*\"europ\"\n", + "2019-01-31 00:27:55,265 : INFO : topic diff=0.009276, rho=0.052926\n", + "2019-01-31 00:27:55,423 : INFO : PROGRESS: pass 0, at document #716000/4922894\n", + "2019-01-31 00:27:56,862 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:57,128 : INFO : topic #46 (0.020): 0.021*\"stop\" + 0.019*\"sweden\" + 0.018*\"damag\" + 0.018*\"norwai\" + 0.015*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"ton\" + 0.013*\"wind\" + 0.012*\"treeless\" + 0.012*\"huntsvil\"\n", + "2019-01-31 00:27:57,129 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.015*\"fifteenth\" + 0.015*\"western\" + 0.013*\"jpg\" + 0.013*\"colder\" + 0.012*\"record\" + 0.011*\"illicit\" + 0.010*\"blind\" + 0.009*\"arm\" + 0.007*\"green\"\n", + "2019-01-31 00:27:57,130 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.047*\"vigour\" + 0.042*\"tortur\" + 0.042*\"popolo\" + 0.031*\"cotton\" + 0.029*\"regim\" + 0.027*\"area\" + 0.025*\"multitud\" + 0.022*\"citi\" + 0.020*\"prosper\"\n", + "2019-01-31 00:27:57,130 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.020*\"member\" + 0.020*\"gener\" + 0.019*\"seri\" + 0.018*\"govern\" + 0.016*\"nation\" + 0.015*\"appeas\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:27:57,132 : INFO : topic #26 (0.020): 0.030*\"champion\" + 0.030*\"workplac\" + 0.029*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.022*\"event\" + 0.021*\"alic\" + 0.019*\"rainfal\" + 0.018*\"nation\"\n", + "2019-01-31 00:27:57,137 : INFO : topic diff=0.010792, rho=0.052852\n", + "2019-01-31 00:27:57,294 : INFO : PROGRESS: pass 0, at document #718000/4922894\n", + "2019-01-31 
00:27:58,709 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:27:58,975 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.010*\"teufel\" + 0.010*\"battalion\" + 0.010*\"king\" + 0.009*\"empath\" + 0.009*\"till\" + 0.008*\"forc\" + 0.007*\"centuri\" + 0.007*\"armi\"\n", + "2019-01-31 00:27:58,976 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.020*\"gener\" + 0.020*\"member\" + 0.019*\"seri\" + 0.018*\"govern\" + 0.016*\"nation\" + 0.015*\"appeas\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:27:58,977 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.027*\"voluntari\" + 0.025*\"democrat\" + 0.020*\"member\" + 0.018*\"republ\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 00:27:58,978 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"man\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"litig\" + 0.003*\"admit\" + 0.003*\"vision\" + 0.003*\"wither\"\n", + "2019-01-31 00:27:58,979 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.009*\"depress\" + 0.009*\"rosenwald\"\n", + "2019-01-31 00:27:58,985 : INFO : topic diff=0.009099, rho=0.052778\n", + "2019-01-31 00:28:01,721 : INFO : -11.684 per-word bound, 3291.0 perplexity estimate based on a held-out corpus of 2000 documents with 546750 words\n", + "2019-01-31 00:28:01,721 : INFO : PROGRESS: pass 0, at document #720000/4922894\n", + "2019-01-31 00:28:03,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:03,411 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.018*\"sweden\" + 0.018*\"damag\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.013*\"wind\" + 0.013*\"ton\" + 0.012*\"treeless\" + 0.012*\"huntsvil\"\n", + 
"2019-01-31 00:28:03,412 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.018*\"taxpay\" + 0.018*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.012*\"fool\" + 0.011*\"squatter\" + 0.011*\"champion\"\n", + "2019-01-31 00:28:03,413 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.013*\"edit\" + 0.013*\"storag\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"levi\"\n", + "2019-01-31 00:28:03,414 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.023*\"tourist\" + 0.018*\"champion\" + 0.017*\"taxpay\" + 0.016*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.012*\"women\"\n", + "2019-01-31 00:28:03,415 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"man\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"litig\" + 0.003*\"admit\" + 0.003*\"introductori\" + 0.003*\"york\"\n", + "2019-01-31 00:28:03,421 : INFO : topic diff=0.009619, rho=0.052705\n", + "2019-01-31 00:28:03,576 : INFO : PROGRESS: pass 0, at document #722000/4922894\n", + "2019-01-31 00:28:04,986 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:05,252 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.014*\"mount\" + 0.008*\"foam\" + 0.008*\"palmer\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.008*\"sourc\"\n", + "2019-01-31 00:28:05,253 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.009*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.008*\"companhia\" + 0.007*\"bank\" + 0.007*\"countri\" + 0.006*\"function\" + 0.006*\"trace\" + 0.006*\"new\"\n", + "2019-01-31 00:28:05,255 : INFO : topic #39 (0.020): 0.040*\"canada\" + 0.030*\"canadian\" + 0.019*\"toronto\" + 0.016*\"ontario\" + 0.016*\"scientist\" + 0.015*\"taxpay\" + 0.015*\"hoar\" + 0.013*\"basketbal\" + 0.012*\"new\" + 0.012*\"confer\"\n", + "2019-01-31 
00:28:05,256 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.009*\"rosenwald\" + 0.009*\"depress\"\n", + "2019-01-31 00:28:05,257 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"champion\"\n", + "2019-01-31 00:28:05,263 : INFO : topic diff=0.010817, rho=0.052632\n", + "2019-01-31 00:28:05,426 : INFO : PROGRESS: pass 0, at document #724000/4922894\n", + "2019-01-31 00:28:06,862 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:07,128 : INFO : topic #17 (0.020): 0.069*\"church\" + 0.022*\"cathol\" + 0.020*\"christian\" + 0.019*\"bishop\" + 0.014*\"sail\" + 0.013*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.008*\"italian\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:28:07,129 : INFO : topic #33 (0.020): 0.066*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:28:07,130 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"rel\" + 0.028*\"son\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:28:07,132 : INFO : topic #16 (0.020): 0.036*\"king\" + 0.032*\"priest\" + 0.022*\"grammat\" + 0.021*\"duke\" + 0.020*\"quarterli\" + 0.017*\"rotterdam\" + 0.015*\"idiosyncrat\" + 0.015*\"brazil\" + 0.014*\"princ\" + 0.014*\"maria\"\n", + "2019-01-31 00:28:07,133 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"juan\" + 
0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"josé\" + 0.010*\"francisco\"\n", + "2019-01-31 00:28:07,138 : INFO : topic diff=0.009092, rho=0.052559\n", + "2019-01-31 00:28:07,297 : INFO : PROGRESS: pass 0, at document #726000/4922894\n", + "2019-01-31 00:28:08,748 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:09,015 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.034*\"sovereignti\" + 0.030*\"rural\" + 0.026*\"reprint\" + 0.023*\"personifi\" + 0.021*\"poison\" + 0.019*\"moscow\" + 0.017*\"poland\" + 0.015*\"malaysia\" + 0.014*\"czech\"\n", + "2019-01-31 00:28:09,016 : INFO : topic #17 (0.020): 0.069*\"church\" + 0.023*\"cathol\" + 0.020*\"christian\" + 0.019*\"bishop\" + 0.014*\"sail\" + 0.013*\"retroflex\" + 0.011*\"centuri\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.008*\"historiographi\"\n", + "2019-01-31 00:28:09,017 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.014*\"oper\" + 0.012*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:28:09,018 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.017*\"physician\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:28:09,019 : INFO : topic #33 (0.020): 0.066*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.012*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.009*\"focal\"\n", + "2019-01-31 00:28:09,025 : INFO : topic diff=0.011120, rho=0.052486\n", + "2019-01-31 00:28:09,178 : INFO : PROGRESS: pass 0, at document #728000/4922894\n", + "2019-01-31 00:28:10,585 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:10,851 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.038*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 
0.021*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"pseudo\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:28:10,852 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.022*\"event\" + 0.020*\"alic\" + 0.018*\"rainfal\" + 0.018*\"nation\"\n", + "2019-01-31 00:28:10,853 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"septemb\" + 0.021*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.014*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:28:10,854 : INFO : topic #0 (0.020): 0.072*\"statewid\" + 0.038*\"line\" + 0.038*\"arsen\" + 0.034*\"raid\" + 0.029*\"museo\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.016*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:28:10,855 : INFO : topic #39 (0.020): 0.041*\"canada\" + 0.030*\"canadian\" + 0.018*\"toronto\" + 0.016*\"ontario\" + 0.016*\"scientist\" + 0.015*\"hoar\" + 0.015*\"taxpay\" + 0.013*\"basketbal\" + 0.013*\"confer\" + 0.012*\"new\"\n", + "2019-01-31 00:28:10,861 : INFO : topic diff=0.009583, rho=0.052414\n", + "2019-01-31 00:28:11,022 : INFO : PROGRESS: pass 0, at document #730000/4922894\n", + "2019-01-31 00:28:12,478 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:12,744 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.017*\"physician\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:28:12,745 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:28:12,746 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.024*\"london\" + 
0.021*\"australian\" + 0.021*\"british\" + 0.021*\"england\" + 0.020*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:28:12,747 : INFO : topic #36 (0.020): 0.018*\"companhia\" + 0.011*\"network\" + 0.010*\"serv\" + 0.010*\"develop\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.008*\"base\" + 0.007*\"manag\" + 0.007*\"includ\" + 0.007*\"oper\"\n", + "2019-01-31 00:28:12,748 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"candid\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.011*\"ret\" + 0.011*\"squatter\" + 0.011*\"landslid\" + 0.010*\"fool\"\n", + "2019-01-31 00:28:12,754 : INFO : topic diff=0.012185, rho=0.052342\n", + "2019-01-31 00:28:12,914 : INFO : PROGRESS: pass 0, at document #732000/4922894\n", + "2019-01-31 00:28:14,325 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:14,594 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.037*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"pseudo\" + 0.009*\"task\" + 0.008*\"class\"\n", + "2019-01-31 00:28:14,595 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.056*\"parti\" + 0.026*\"voluntari\" + 0.025*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.017*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:28:14,597 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.033*\"new\" + 0.024*\"palmer\" + 0.017*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:28:14,598 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.023*\"tourist\" + 0.019*\"champion\" + 0.017*\"taxpay\" + 0.016*\"chamber\" + 0.016*\"martin\" + 0.014*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 00:28:14,599 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"rel\" + 0.028*\"son\" + 0.026*\"reconstruct\" + 
0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:28:14,605 : INFO : topic diff=0.009083, rho=0.052271\n", + "2019-01-31 00:28:14,764 : INFO : PROGRESS: pass 0, at document #734000/4922894\n", + "2019-01-31 00:28:16,210 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:16,476 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"sens\" + 0.074*\"octob\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.068*\"august\" + 0.067*\"notion\" + 0.065*\"april\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 00:28:16,477 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:28:16,478 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.013*\"edit\" + 0.013*\"storag\" + 0.012*\"presid\" + 0.012*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"collect\"\n", + "2019-01-31 00:28:16,479 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.010*\"georg\" + 0.010*\"mexican–american\" + 0.009*\"rhyme\" + 0.009*\"slur\" + 0.008*\"paul\"\n", + "2019-01-31 00:28:16,481 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"night\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.003*\"ladi\" + 0.003*\"introductori\" + 0.003*\"vision\"\n", + "2019-01-31 00:28:16,486 : INFO : topic diff=0.010534, rho=0.052200\n", + "2019-01-31 00:28:16,700 : INFO : PROGRESS: pass 0, at document #736000/4922894\n", + "2019-01-31 00:28:18,086 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:18,352 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.022*\"act\" + 0.019*\"start\" + 
0.016*\"ricardo\" + 0.014*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.007*\"replac\"\n", + "2019-01-31 00:28:18,353 : INFO : topic #17 (0.020): 0.070*\"church\" + 0.023*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.014*\"sail\" + 0.013*\"retroflex\" + 0.011*\"centuri\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:28:18,355 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.029*\"hong\" + 0.026*\"kong\" + 0.021*\"korea\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.015*\"min\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 00:28:18,356 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"night\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.003*\"vision\" + 0.003*\"ladi\" + 0.003*\"introductori\"\n", + "2019-01-31 00:28:18,357 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"like\" + 0.004*\"deal\" + 0.004*\"help\"\n", + "2019-01-31 00:28:18,363 : INFO : topic diff=0.010058, rho=0.052129\n", + "2019-01-31 00:28:18,522 : INFO : PROGRESS: pass 0, at document #738000/4922894\n", + "2019-01-31 00:28:19,963 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:20,230 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.014*\"driver\" + 0.013*\"find\" + 0.011*\"ret\" + 0.011*\"tornado\" + 0.011*\"landslid\" + 0.011*\"fool\" + 0.010*\"champion\"\n", + "2019-01-31 00:28:20,231 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.016*\"physician\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:28:20,232 : INFO : topic #41 (0.020): 0.043*\"citi\" + 
0.033*\"new\" + 0.024*\"palmer\" + 0.017*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:28:20,233 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:28:20,234 : INFO : topic #39 (0.020): 0.042*\"canada\" + 0.031*\"canadian\" + 0.018*\"toronto\" + 0.015*\"ontario\" + 0.015*\"scientist\" + 0.015*\"hoar\" + 0.014*\"taxpay\" + 0.013*\"basketbal\" + 0.012*\"new\" + 0.012*\"confer\"\n", + "2019-01-31 00:28:20,241 : INFO : topic diff=0.010591, rho=0.052058\n", + "2019-01-31 00:28:23,019 : INFO : -11.716 per-word bound, 3364.1 perplexity estimate based on a held-out corpus of 2000 documents with 572016 words\n", + "2019-01-31 00:28:23,019 : INFO : PROGRESS: pass 0, at document #740000/4922894\n", + "2019-01-31 00:28:24,463 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:24,729 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.010*\"form\" + 0.008*\"mean\" + 0.008*\"centuri\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.006*\"charact\" + 0.006*\"english\"\n", + "2019-01-31 00:28:24,730 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.027*\"final\" + 0.023*\"tourist\" + 0.022*\"wife\" + 0.019*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 00:28:24,731 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.034*\"sovereignti\" + 0.030*\"rural\" + 0.025*\"reprint\" + 0.025*\"personifi\" + 0.021*\"poison\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"turin\" + 0.014*\"czech\"\n", + "2019-01-31 00:28:24,732 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.010*\"mode\" + 0.009*\"elabor\" + 
0.008*\"produc\" + 0.008*\"candid\" + 0.008*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"proclaim\"\n", + "2019-01-31 00:28:24,733 : INFO : topic #16 (0.020): 0.037*\"king\" + 0.033*\"priest\" + 0.024*\"quarterli\" + 0.021*\"grammat\" + 0.021*\"duke\" + 0.018*\"rotterdam\" + 0.015*\"idiosyncrat\" + 0.015*\"princ\" + 0.015*\"maria\" + 0.013*\"brazil\"\n", + "2019-01-31 00:28:24,739 : INFO : topic diff=0.009036, rho=0.051988\n", + "2019-01-31 00:28:24,893 : INFO : PROGRESS: pass 0, at document #742000/4922894\n", + "2019-01-31 00:28:26,275 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:26,544 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.008*\"centuri\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.006*\"god\" + 0.006*\"charact\"\n", + "2019-01-31 00:28:26,545 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.027*\"hong\" + 0.025*\"kong\" + 0.021*\"korea\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.014*\"leah\" + 0.014*\"min\" + 0.013*\"kim\"\n", + "2019-01-31 00:28:26,546 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"warmth\" + 0.015*\"mount\" + 0.011*\"palmer\" + 0.009*\"north\" + 0.008*\"vacant\" + 0.008*\"foam\" + 0.008*\"land\"\n", + "2019-01-31 00:28:26,547 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.020*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"pseudo\" + 0.009*\"gothic\"\n", + "2019-01-31 00:28:26,548 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.033*\"new\" + 0.024*\"palmer\" + 0.017*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:28:26,554 : INFO : topic diff=0.009144, rho=0.051917\n", + "2019-01-31 00:28:26,709 : INFO : PROGRESS: pass 0, at document #744000/4922894\n", + "2019-01-31 
00:28:28,108 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:28,374 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.076*\"sens\" + 0.076*\"octob\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.068*\"notion\" + 0.067*\"august\" + 0.067*\"decatur\" + 0.065*\"april\" + 0.064*\"judici\"\n", + "2019-01-31 00:28:28,375 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.004*\"like\" + 0.004*\"deal\" + 0.004*\"help\"\n", + "2019-01-31 00:28:28,376 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.009*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.008*\"companhia\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"new\"\n", + "2019-01-31 00:28:28,377 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.043*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.015*\"daphn\" + 0.012*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:28:28,378 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.012*\"jewish\" + 0.011*\"israel\" + 0.009*\"austria\" + 0.008*\"itali\" + 0.008*\"hungarian\"\n", + "2019-01-31 00:28:28,384 : INFO : topic diff=0.009368, rho=0.051848\n", + "2019-01-31 00:28:28,539 : INFO : PROGRESS: pass 0, at document #746000/4922894\n", + "2019-01-31 00:28:29,956 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:30,222 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.039*\"arsen\" + 0.038*\"line\" + 0.032*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.019*\"pain\" + 0.018*\"serv\" + 0.014*\"artist\" + 0.014*\"exhaust\"\n", + "2019-01-31 00:28:30,223 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.022*\"london\" + 0.022*\"australian\" + 0.022*\"ireland\" + 0.022*\"england\" + 
0.020*\"british\" + 0.016*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 00:28:30,224 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.015*\"olympo\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:28:30,226 : INFO : topic #35 (0.020): 0.051*\"russia\" + 0.034*\"sovereignti\" + 0.031*\"rural\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.022*\"poison\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.014*\"turin\" + 0.014*\"czech\"\n", + "2019-01-31 00:28:30,227 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.015*\"fifteenth\" + 0.015*\"jpg\" + 0.014*\"western\" + 0.014*\"colder\" + 0.013*\"illicit\" + 0.011*\"record\" + 0.009*\"blind\" + 0.007*\"arm\" + 0.007*\"green\"\n", + "2019-01-31 00:28:30,233 : INFO : topic diff=0.008913, rho=0.051778\n", + "2019-01-31 00:28:30,391 : INFO : PROGRESS: pass 0, at document #748000/4922894\n", + "2019-01-31 00:28:31,834 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:32,100 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.022*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.021*\"ireland\" + 0.020*\"british\" + 0.016*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 00:28:32,101 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"candid\" + 0.014*\"driver\" + 0.014*\"horac\" + 0.013*\"find\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 00:28:32,102 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.012*\"jewish\" + 0.011*\"israel\" + 0.008*\"austria\" + 0.008*\"itali\" + 0.008*\"europ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:28:32,104 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.021*\"act\" + 
0.019*\"start\" + 0.016*\"ricardo\" + 0.014*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"replac\"\n", + "2019-01-31 00:28:32,105 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.048*\"chilton\" + 0.028*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.015*\"sourc\" + 0.015*\"korean\" + 0.014*\"leah\" + 0.013*\"kim\" + 0.013*\"min\"\n", + "2019-01-31 00:28:32,110 : INFO : topic diff=0.008882, rho=0.051709\n", + "2019-01-31 00:28:32,264 : INFO : PROGRESS: pass 0, at document #750000/4922894\n", + "2019-01-31 00:28:33,669 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:33,935 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.035*\"sovereignti\" + 0.031*\"rural\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.022*\"poison\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:28:33,936 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.037*\"american\" + 0.028*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.016*\"english\" + 0.016*\"polit\" + 0.015*\"player\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:28:33,937 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.039*\"cotton\" + 0.030*\"unionist\" + 0.027*\"american\" + 0.022*\"new\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"year\" + 0.011*\"north\"\n", + "2019-01-31 00:28:33,938 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.045*\"vigour\" + 0.041*\"tortur\" + 0.041*\"popolo\" + 0.039*\"area\" + 0.030*\"cotton\" + 0.027*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.018*\"commun\"\n", + "2019-01-31 00:28:33,940 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.016*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 00:28:33,945 : INFO : topic diff=0.008682, rho=0.051640\n", + "2019-01-31 00:28:34,106 : INFO : PROGRESS: pass 
0, at document #752000/4922894\n", + "2019-01-31 00:28:35,528 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:35,794 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.033*\"new\" + 0.023*\"palmer\" + 0.017*\"year\" + 0.015*\"center\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"lobe\" + 0.010*\"includ\" + 0.008*\"highli\"\n", + "2019-01-31 00:28:35,795 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.045*\"vigour\" + 0.041*\"tortur\" + 0.041*\"popolo\" + 0.039*\"area\" + 0.029*\"cotton\" + 0.027*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:28:35,797 : INFO : topic #31 (0.020): 0.066*\"fusiform\" + 0.025*\"player\" + 0.023*\"scientist\" + 0.021*\"taxpay\" + 0.020*\"place\" + 0.013*\"leagu\" + 0.012*\"clot\" + 0.011*\"folei\" + 0.009*\"barber\" + 0.009*\"ruler\"\n", + "2019-01-31 00:28:35,798 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"method\"\n", + "2019-01-31 00:28:35,799 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.018*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.010*\"http\"\n", + "2019-01-31 00:28:35,805 : INFO : topic diff=0.010350, rho=0.051571\n", + "2019-01-31 00:28:35,959 : INFO : PROGRESS: pass 0, at document #754000/4922894\n", + "2019-01-31 00:28:37,373 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:37,639 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.018*\"stop\" + 0.018*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.013*\"unjust\" + 0.012*\"treeless\" + 0.011*\"ton\"\n", + "2019-01-31 00:28:37,640 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.045*\"vigour\" + 
0.041*\"tortur\" + 0.041*\"popolo\" + 0.038*\"area\" + 0.029*\"cotton\" + 0.026*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:28:37,641 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.024*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\" + 0.011*\"lizard\"\n", + "2019-01-31 00:28:37,642 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.036*\"sovereignti\" + 0.031*\"rural\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.022*\"poison\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"czech\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:28:37,643 : INFO : topic #29 (0.020): 0.010*\"start\" + 0.009*\"govern\" + 0.009*\"million\" + 0.009*\"companhia\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.006*\"function\" + 0.006*\"trace\" + 0.006*\"new\"\n", + "2019-01-31 00:28:37,649 : INFO : topic diff=0.008350, rho=0.051503\n", + "2019-01-31 00:28:37,804 : INFO : PROGRESS: pass 0, at document #756000/4922894\n", + "2019-01-31 00:28:39,213 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:39,479 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.025*\"player\" + 0.024*\"scientist\" + 0.021*\"taxpay\" + 0.021*\"place\" + 0.013*\"leagu\" + 0.012*\"clot\" + 0.011*\"folei\" + 0.009*\"barber\" + 0.009*\"ruler\"\n", + "2019-01-31 00:28:39,480 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:28:39,481 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.047*\"chilton\" + 0.027*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.016*\"leah\" + 0.015*\"korean\" + 0.015*\"sourc\" + 0.014*\"min\" + 0.014*\"kim\"\n", + "2019-01-31 00:28:39,482 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"collector\" + 
0.024*\"schuster\" + 0.021*\"institut\" + 0.019*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.010*\"http\"\n", + "2019-01-31 00:28:39,483 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"olympo\" + 0.015*\"damn\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:28:39,490 : INFO : topic diff=0.009668, rho=0.051434\n", + "2019-01-31 00:28:39,647 : INFO : PROGRESS: pass 0, at document #758000/4922894\n", + "2019-01-31 00:28:41,157 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:41,423 : INFO : topic #0 (0.020): 0.071*\"statewid\" + 0.040*\"arsen\" + 0.038*\"line\" + 0.032*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.018*\"pain\" + 0.017*\"serv\" + 0.014*\"artist\" + 0.014*\"exhaust\"\n", + "2019-01-31 00:28:41,425 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.025*\"player\" + 0.024*\"scientist\" + 0.021*\"taxpay\" + 0.021*\"place\" + 0.013*\"leagu\" + 0.012*\"clot\" + 0.012*\"folei\" + 0.010*\"barber\" + 0.009*\"ruler\"\n", + "2019-01-31 00:28:41,426 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"collector\" + 0.024*\"schuster\" + 0.020*\"institut\" + 0.019*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 00:28:41,427 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.027*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.016*\"leah\" + 0.015*\"korean\" + 0.015*\"sourc\" + 0.014*\"min\" + 0.014*\"kim\"\n", + "2019-01-31 00:28:41,428 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.043*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.015*\"daphn\" + 0.012*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:28:41,434 : INFO : topic diff=0.008459, rho=0.051367\n", + "2019-01-31 00:28:44,196 : INFO : 
-11.812 per-word bound, 3594.4 perplexity estimate based on a held-out corpus of 2000 documents with 586166 words\n", + "2019-01-31 00:28:44,196 : INFO : PROGRESS: pass 0, at document #760000/4922894\n", + "2019-01-31 00:28:45,624 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:45,890 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.037*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:28:45,891 : INFO : topic #46 (0.020): 0.022*\"damag\" + 0.018*\"sweden\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.013*\"norwegian\" + 0.013*\"ton\" + 0.013*\"wind\" + 0.012*\"unjust\" + 0.011*\"treeless\"\n", + "2019-01-31 00:28:45,893 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.017*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.010*\"georg\" + 0.010*\"mexican–american\" + 0.009*\"wilson\" + 0.009*\"rhyme\" + 0.008*\"slur\"\n", + "2019-01-31 00:28:45,894 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.016*\"fifteenth\" + 0.015*\"illicit\" + 0.015*\"jpg\" + 0.014*\"western\" + 0.013*\"colder\" + 0.011*\"record\" + 0.009*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:28:45,895 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.018*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:28:45,901 : INFO : topic diff=0.008575, rho=0.051299\n", + "2019-01-31 00:28:46,059 : INFO : PROGRESS: pass 0, at document #762000/4922894\n", + "2019-01-31 00:28:47,490 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:47,759 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 
0.022*\"jean\" + 0.016*\"daphn\" + 0.012*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:28:47,760 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"lizard\"\n", + "2019-01-31 00:28:47,761 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.007*\"exampl\" + 0.007*\"servitud\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.005*\"method\"\n", + "2019-01-31 00:28:47,762 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:28:47,764 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.024*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.018*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 00:28:47,769 : INFO : topic diff=0.008768, rho=0.051232\n", + "2019-01-31 00:28:47,923 : INFO : PROGRESS: pass 0, at document #764000/4922894\n", + "2019-01-31 00:28:49,323 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:49,588 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"australia\" + 0.024*\"london\" + 0.022*\"england\" + 0.022*\"australian\" + 0.021*\"ireland\" + 0.021*\"british\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:28:49,589 : INFO : topic #36 (0.020): 0.017*\"companhia\" + 0.011*\"network\" + 0.011*\"pop\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.009*\"prognosi\" + 0.008*\"base\" + 0.008*\"user\" + 0.008*\"includ\" + 0.007*\"manag\"\n", + "2019-01-31 00:28:49,590 : INFO : topic #45 (0.020): 0.016*\"black\" + 0.016*\"fifteenth\" + 0.015*\"jpg\" + 0.014*\"western\" + 
0.014*\"illicit\" + 0.013*\"colder\" + 0.011*\"record\" + 0.009*\"blind\" + 0.007*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:28:49,592 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.012*\"jewish\" + 0.012*\"israel\" + 0.012*\"der\" + 0.009*\"itali\" + 0.009*\"europ\" + 0.008*\"austria\"\n", + "2019-01-31 00:28:49,593 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:28:49,599 : INFO : topic diff=0.008894, rho=0.051164\n", + "2019-01-31 00:28:49,816 : INFO : PROGRESS: pass 0, at document #766000/4922894\n", + "2019-01-31 00:28:51,246 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:51,512 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.012*\"jewish\" + 0.012*\"der\" + 0.009*\"itali\" + 0.008*\"europ\" + 0.008*\"austria\"\n", + "2019-01-31 00:28:51,513 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.074*\"januari\" + 0.072*\"notion\" + 0.071*\"juli\" + 0.070*\"august\" + 0.069*\"decatur\" + 0.069*\"april\" + 0.068*\"judici\"\n", + "2019-01-31 00:28:51,514 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.040*\"cotton\" + 0.031*\"unionist\" + 0.028*\"american\" + 0.023*\"new\" + 0.015*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"year\" + 0.011*\"north\"\n", + "2019-01-31 00:28:51,515 : INFO : topic #49 (0.020): 0.046*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"start\" + 0.010*\"singh\" + 0.009*\"alam\"\n", + "2019-01-31 00:28:51,516 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.036*\"shield\" + 0.020*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 
0.013*\"coalit\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.011*\"class\" + 0.010*\"bahá\"\n", + "2019-01-31 00:28:51,522 : INFO : topic diff=0.008444, rho=0.051098\n", + "2019-01-31 00:28:51,688 : INFO : PROGRESS: pass 0, at document #768000/4922894\n", + "2019-01-31 00:28:53,120 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:53,386 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:28:53,387 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.056*\"parti\" + 0.027*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:28:53,388 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.005*\"night\" + 0.003*\"vision\" + 0.003*\"ladi\" + 0.003*\"healthcar\"\n", + "2019-01-31 00:28:53,389 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.031*\"canadian\" + 0.017*\"toronto\" + 0.016*\"hoar\" + 0.015*\"ontario\" + 0.015*\"basketbal\" + 0.014*\"taxpay\" + 0.014*\"scientist\" + 0.012*\"new\" + 0.012*\"confer\"\n", + "2019-01-31 00:28:53,390 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"storag\" + 0.013*\"nicola\" + 0.012*\"presid\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:28:53,396 : INFO : topic diff=0.009250, rho=0.051031\n", + "2019-01-31 00:28:53,553 : INFO : PROGRESS: pass 0, at document #770000/4922894\n", + "2019-01-31 00:28:54,959 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:55,228 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.019*\"teacher\" + 
0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:28:55,229 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.005*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 00:28:55,230 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.046*\"chilton\" + 0.029*\"hong\" + 0.027*\"kong\" + 0.023*\"korea\" + 0.020*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.014*\"kim\" + 0.012*\"min\"\n", + "2019-01-31 00:28:55,232 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.037*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.020*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"task\" + 0.009*\"district\"\n", + "2019-01-31 00:28:55,233 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.033*\"new\" + 0.022*\"palmer\" + 0.016*\"year\" + 0.014*\"strategist\" + 0.014*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:28:55,239 : INFO : topic diff=0.008915, rho=0.050965\n", + "2019-01-31 00:28:55,401 : INFO : PROGRESS: pass 0, at document #772000/4922894\n", + "2019-01-31 00:28:56,856 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:57,122 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.037*\"area\" + 0.028*\"cotton\" + 0.026*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:28:57,123 : INFO : topic #29 (0.020): 0.010*\"million\" + 0.010*\"start\" + 0.010*\"govern\" + 0.009*\"companhia\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"market\"\n", + "2019-01-31 00:28:57,124 : INFO : topic #36 (0.020): 0.016*\"companhia\" + 0.011*\"network\" + 0.010*\"pop\" + 0.009*\"develop\" + 
0.009*\"prognosi\" + 0.009*\"serv\" + 0.008*\"base\" + 0.008*\"includ\" + 0.007*\"user\" + 0.007*\"manag\"\n", + "2019-01-31 00:28:57,126 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.031*\"canadian\" + 0.017*\"hoar\" + 0.017*\"toronto\" + 0.015*\"ontario\" + 0.014*\"basketbal\" + 0.014*\"taxpay\" + 0.014*\"scientist\" + 0.012*\"new\" + 0.012*\"confer\"\n", + "2019-01-31 00:28:57,127 : INFO : topic #46 (0.020): 0.019*\"damag\" + 0.018*\"sweden\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.010*\"farid\" + 0.010*\"unjust\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:28:57,133 : INFO : topic diff=0.010324, rho=0.050899\n", + "2019-01-31 00:28:57,292 : INFO : PROGRESS: pass 0, at document #774000/4922894\n", + "2019-01-31 00:28:58,722 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:28:58,988 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.025*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.014*\"loui\" + 0.012*\"lazi\" + 0.010*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:28:58,990 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.018*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.014*\"margin\" + 0.013*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:28:58,991 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.018*\"taxpay\" + 0.016*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:28:58,992 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.026*\"valour\" + 0.020*\"folei\" + 0.018*\"english\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:28:58,993 : INFO : topic #37 (0.020): 0.010*\"love\" + 
0.009*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"night\" + 0.003*\"vision\" + 0.003*\"ladi\" + 0.003*\"madison\"\n", + "2019-01-31 00:28:58,999 : INFO : topic diff=0.009207, rho=0.050833\n", + "2019-01-31 00:28:59,154 : INFO : PROGRESS: pass 0, at document #776000/4922894\n", + "2019-01-31 00:29:00,578 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:00,844 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.025*\"player\" + 0.024*\"scientist\" + 0.021*\"taxpay\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"barber\" + 0.009*\"ruler\"\n", + "2019-01-31 00:29:00,846 : INFO : topic #16 (0.020): 0.037*\"king\" + 0.034*\"priest\" + 0.021*\"duke\" + 0.021*\"grammat\" + 0.020*\"quarterli\" + 0.017*\"rotterdam\" + 0.015*\"idiosyncrat\" + 0.014*\"maria\" + 0.014*\"princ\" + 0.013*\"brazil\"\n", + "2019-01-31 00:29:00,847 : INFO : topic #29 (0.020): 0.010*\"govern\" + 0.010*\"start\" + 0.009*\"million\" + 0.009*\"companhia\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"market\"\n", + "2019-01-31 00:29:00,848 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.027*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.009*\"yawn\" + 0.009*\"genu\"\n", + "2019-01-31 00:29:00,849 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"proper\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"hormon\" + 0.006*\"effect\"\n", + "2019-01-31 00:29:00,855 : INFO : topic diff=0.008623, rho=0.050767\n", + "2019-01-31 00:29:01,012 : INFO : PROGRESS: pass 0, at document #778000/4922894\n", + "2019-01-31 00:29:02,440 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:02,707 : INFO : topic #4 (0.020): 
0.024*\"enfranchis\" + 0.016*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"candid\" + 0.009*\"produc\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:29:02,708 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.008*\"southern\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 00:29:02,709 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"act\" + 0.019*\"start\" + 0.015*\"ricardo\" + 0.013*\"case\" + 0.013*\"polaris\" + 0.009*\"legal\" + 0.009*\"judaism\" + 0.008*\"justic\"\n", + "2019-01-31 00:29:02,710 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.009*\"vacant\" + 0.008*\"foam\" + 0.008*\"sourc\"\n", + "2019-01-31 00:29:02,712 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.042*\"popolo\" + 0.040*\"tortur\" + 0.036*\"area\" + 0.028*\"cotton\" + 0.026*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:29:02,717 : INFO : topic diff=0.008873, rho=0.050702\n", + "2019-01-31 00:29:05,364 : INFO : -11.571 per-word bound, 3042.2 perplexity estimate based on a held-out corpus of 2000 documents with 517534 words\n", + "2019-01-31 00:29:05,365 : INFO : PROGRESS: pass 0, at document #780000/4922894\n", + "2019-01-31 00:29:06,750 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:07,016 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.030*\"serv\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.020*\"member\" + 0.017*\"govern\" + 0.017*\"seri\" + 0.017*\"nation\" + 0.017*\"gener\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:29:07,018 : INFO : topic #29 (0.020): 0.010*\"govern\" + 0.009*\"start\" + 0.009*\"million\" + 0.009*\"companhia\" + 0.009*\"yawn\" + 
0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"trace\" + 0.006*\"market\"\n", + "2019-01-31 00:29:07,019 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.043*\"franc\" + 0.030*\"pari\" + 0.025*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.010*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:29:07,020 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"student\" + 0.007*\"human\"\n", + "2019-01-31 00:29:07,021 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.010*\"aza\" + 0.010*\"king\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.009*\"centuri\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"embassi\"\n", + "2019-01-31 00:29:07,027 : INFO : topic diff=0.008137, rho=0.050637\n", + "2019-01-31 00:29:07,182 : INFO : PROGRESS: pass 0, at document #782000/4922894\n", + "2019-01-31 00:29:08,595 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:08,862 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.010*\"aza\" + 0.010*\"king\" + 0.010*\"battalion\" + 0.009*\"empath\" + 0.009*\"centuri\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.007*\"embassi\" + 0.007*\"armi\"\n", + "2019-01-31 00:29:08,863 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"area\" + 0.015*\"mount\" + 0.011*\"palmer\" + 0.009*\"north\" + 0.008*\"vacant\" + 0.008*\"foam\" + 0.008*\"sourc\"\n", + "2019-01-31 00:29:08,865 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"historiographi\" + 0.009*\"relationship\" + 0.009*\"poll\"\n", + "2019-01-31 00:29:08,866 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.039*\"cotton\" + 0.030*\"unionist\" + 0.027*\"american\" + 0.023*\"new\" + 0.015*\"california\" 
+ 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"year\" + 0.011*\"north\"\n", + "2019-01-31 00:29:08,867 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.009*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.004*\"night\" + 0.003*\"vision\" + 0.003*\"york\" + 0.003*\"ladi\"\n", + "2019-01-31 00:29:08,873 : INFO : topic diff=0.008638, rho=0.050572\n", + "2019-01-31 00:29:09,028 : INFO : PROGRESS: pass 0, at document #784000/4922894\n", + "2019-01-31 00:29:10,431 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:10,697 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.016*\"warmth\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.015*\"area\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.008*\"vacant\" + 0.008*\"foam\" + 0.008*\"sourc\"\n", + "2019-01-31 00:29:10,699 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:29:10,700 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.017*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:29:10,701 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"presid\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:29:10,702 : INFO : topic #29 (0.020): 0.009*\"govern\" + 0.009*\"million\" + 0.009*\"start\" + 0.009*\"companhia\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"market\" + 0.006*\"trace\"\n", + "2019-01-31 00:29:10,708 : INFO : topic diff=0.008466, rho=0.050508\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:29:10,871 : INFO : PROGRESS: pass 
0, at document #786000/4922894\n", + "2019-01-31 00:29:12,334 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:12,601 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.013*\"storag\" + 0.012*\"presid\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:29:12,602 : INFO : topic #13 (0.020): 0.025*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"london\" + 0.021*\"england\" + 0.021*\"australian\" + 0.020*\"ireland\" + 0.020*\"british\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:29:12,603 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"utopian\" + 0.005*\"measur\"\n", + "2019-01-31 00:29:12,604 : INFO : topic #23 (0.020): 0.130*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 00:29:12,605 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.042*\"arsen\" + 0.036*\"line\" + 0.034*\"museo\" + 0.034*\"raid\" + 0.019*\"traceabl\" + 0.018*\"pain\" + 0.017*\"serv\" + 0.015*\"exhaust\" + 0.014*\"artist\"\n", + "2019-01-31 00:29:12,611 : INFO : topic diff=0.008958, rho=0.050443\n", + "2019-01-31 00:29:12,770 : INFO : PROGRESS: pass 0, at document #788000/4922894\n", + "2019-01-31 00:29:14,200 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:14,466 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"utopian\"\n", + "2019-01-31 00:29:14,468 : INFO : topic #31 (0.020): 0.065*\"fusiform\" + 0.025*\"scientist\" + 
0.024*\"player\" + 0.021*\"taxpay\" + 0.021*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.009*\"ruler\" + 0.009*\"barber\"\n", + "2019-01-31 00:29:14,469 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.042*\"american\" + 0.026*\"valour\" + 0.020*\"folei\" + 0.018*\"english\" + 0.017*\"dutch\" + 0.017*\"player\" + 0.015*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:29:14,470 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.010*\"linear\" + 0.010*\"strategist\" + 0.009*\"silicon\"\n", + "2019-01-31 00:29:14,471 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.027*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.010*\"biom\" + 0.010*\"yawn\"\n", + "2019-01-31 00:29:14,477 : INFO : topic diff=0.008537, rho=0.050379\n", + "2019-01-31 00:29:14,641 : INFO : PROGRESS: pass 0, at document #790000/4922894\n", + "2019-01-31 00:29:16,050 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:16,316 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.042*\"american\" + 0.026*\"valour\" + 0.021*\"dutch\" + 0.019*\"folei\" + 0.018*\"english\" + 0.017*\"player\" + 0.015*\"polit\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:29:16,318 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.010*\"aza\" + 0.010*\"king\" + 0.010*\"battalion\" + 0.009*\"centuri\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"embassi\"\n", + "2019-01-31 00:29:16,319 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.004*\"litig\" + 0.004*\"night\" + 0.004*\"vision\" + 0.003*\"york\" + 0.003*\"ladi\"\n", + "2019-01-31 00:29:16,320 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.031*\"woman\" + 0.030*\"champion\" + 
0.026*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.020*\"nation\" + 0.019*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:29:16,321 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.023*\"folei\" + 0.016*\"goal\" + 0.014*\"martin\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:29:16,327 : INFO : topic diff=0.007219, rho=0.050315\n", + "2019-01-31 00:29:16,478 : INFO : PROGRESS: pass 0, at document #792000/4922894\n", + "2019-01-31 00:29:17,856 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:18,123 : INFO : topic #36 (0.020): 0.015*\"companhia\" + 0.011*\"network\" + 0.010*\"pop\" + 0.009*\"prognosi\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.007*\"includ\" + 0.007*\"base\" + 0.007*\"user\" + 0.007*\"diggin\"\n", + "2019-01-31 00:29:18,124 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.015*\"olympo\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:29:18,125 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.016*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:29:18,127 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.042*\"american\" + 0.026*\"valour\" + 0.021*\"dutch\" + 0.019*\"folei\" + 0.018*\"english\" + 0.017*\"player\" + 0.015*\"polit\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:29:18,128 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.034*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.012*\"presid\" + 0.012*\"storag\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:29:18,133 : INFO : topic diff=0.009157, rho=0.050252\n", + "2019-01-31 00:29:18,289 : INFO : 
PROGRESS: pass 0, at document #794000/4922894\n", + "2019-01-31 00:29:19,709 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:19,976 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.034*\"rural\" + 0.034*\"sovereignti\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.024*\"poison\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:29:19,977 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.013*\"faster\" + 0.012*\"life\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:29:19,978 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:29:19,979 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"pope\" + 0.013*\"scot\" + 0.012*\"coalit\" + 0.011*\"blur\" + 0.010*\"nativist\" + 0.010*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 00:29:19,980 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.034*\"area\" + 0.028*\"cotton\" + 0.026*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.021*\"commun\"\n", + "2019-01-31 00:29:19,986 : INFO : topic diff=0.007998, rho=0.050189\n", + "2019-01-31 00:29:20,145 : INFO : PROGRESS: pass 0, at document #796000/4922894\n", + "2019-01-31 00:29:21,576 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:21,842 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.030*\"woman\" + 0.027*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.020*\"nation\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:29:21,843 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"septemb\" + 0.022*\"epiru\" + 
0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 00:29:21,844 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.017*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:29:21,845 : INFO : topic #37 (0.020): 0.010*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.005*\"night\" + 0.004*\"litig\" + 0.004*\"vision\" + 0.003*\"york\" + 0.003*\"ladi\"\n", + "2019-01-31 00:29:21,846 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.034*\"area\" + 0.028*\"cotton\" + 0.025*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.021*\"commun\"\n", + "2019-01-31 00:29:21,852 : INFO : topic diff=0.009112, rho=0.050125\n", + "2019-01-31 00:29:22,056 : INFO : PROGRESS: pass 0, at document #798000/4922894\n", + "2019-01-31 00:29:23,448 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:29:23,714 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 00:29:23,715 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.028*\"minist\" + 0.027*\"offic\" + 0.026*\"serv\" + 0.020*\"member\" + 0.018*\"gener\" + 0.017*\"seri\" + 0.017*\"govern\" + 0.017*\"nation\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:29:23,716 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.021*\"korea\" + 0.017*\"leah\" + 0.017*\"korean\" + 0.017*\"sourc\" + 0.014*\"wang\" + 0.014*\"kim\"\n", + "2019-01-31 00:29:23,717 : INFO : topic #40 (0.020): 
0.089*\"unit\" + 0.025*\"collector\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.016*\"professor\" + 0.011*\"governor\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:29:23,719 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.030*\"champion\" + 0.029*\"woman\" + 0.027*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.021*\"nation\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:29:23,724 : INFO : topic diff=0.009841, rho=0.050063\n", + "2019-01-31 00:29:26,478 : INFO : -11.794 per-word bound, 3552.0 perplexity estimate based on a held-out corpus of 2000 documents with 569599 words\n", + "2019-01-31 00:29:26,479 : INFO : PROGRESS: pass 0, at document #800000/4922894\n", + "2019-01-31 00:29:27,903 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:28,170 : INFO : topic #30 (0.020): 0.038*\"leagu\" + 0.037*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.023*\"folei\" + 0.017*\"goal\" + 0.014*\"martin\" + 0.013*\"diversifi\"\n", + "2019-01-31 00:29:28,171 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.025*\"collector\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:29:28,172 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.005*\"utopian\"\n", + "2019-01-31 00:29:28,173 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"group\" + 0.008*\"commun\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"student\" + 0.007*\"human\"\n", + "2019-01-31 00:29:28,174 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.028*\"final\" + 0.022*\"tourist\" + 0.022*\"wife\" + 
0.019*\"champion\" + 0.018*\"taxpay\" + 0.016*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:29:28,180 : INFO : topic diff=0.008847, rho=0.050000\n", + "2019-01-31 00:29:28,341 : INFO : PROGRESS: pass 0, at document #802000/4922894\n", + "2019-01-31 00:29:29,781 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:30,048 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 00:29:30,049 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.016*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:29:30,050 : INFO : topic #38 (0.020): 0.020*\"walter\" + 0.010*\"aza\" + 0.010*\"king\" + 0.009*\"battalion\" + 0.009*\"centuri\" + 0.008*\"empath\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"embassi\" + 0.007*\"armi\"\n", + "2019-01-31 00:29:30,051 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.018*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.008*\"cathedr\"\n", + "2019-01-31 00:29:30,052 : INFO : topic #34 (0.020): 0.077*\"start\" + 0.036*\"cotton\" + 0.032*\"unionist\" + 0.027*\"american\" + 0.024*\"new\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"year\" + 0.012*\"north\"\n", + "2019-01-31 00:29:30,058 : INFO : topic diff=0.008455, rho=0.049938\n", + "2019-01-31 00:29:30,215 : INFO : PROGRESS: pass 0, at document #804000/4922894\n", + "2019-01-31 00:29:31,651 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:31,917 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 
0.022*\"adulthood\" + 0.016*\"feel\" + 0.016*\"hostil\" + 0.014*\"male\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.010*\"yawn\" + 0.009*\"genu\"\n", + "2019-01-31 00:29:31,918 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"tourist\" + 0.022*\"wife\" + 0.019*\"taxpay\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:29:31,919 : INFO : topic #30 (0.020): 0.038*\"leagu\" + 0.037*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.023*\"folei\" + 0.017*\"goal\" + 0.014*\"martin\" + 0.013*\"diversifi\"\n", + "2019-01-31 00:29:31,921 : INFO : topic #46 (0.020): 0.022*\"sweden\" + 0.019*\"norwai\" + 0.018*\"swedish\" + 0.016*\"stop\" + 0.015*\"damag\" + 0.015*\"norwegian\" + 0.014*\"turkish\" + 0.014*\"wind\" + 0.012*\"denmark\" + 0.011*\"danish\"\n", + "2019-01-31 00:29:31,922 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 00:29:31,928 : INFO : topic diff=0.007734, rho=0.049875\n", + "2019-01-31 00:29:32,086 : INFO : PROGRESS: pass 0, at document #806000/4922894\n", + "2019-01-31 00:29:33,477 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:33,743 : INFO : topic #16 (0.020): 0.041*\"king\" + 0.033*\"priest\" + 0.021*\"grammat\" + 0.020*\"quarterli\" + 0.020*\"duke\" + 0.017*\"rotterdam\" + 0.016*\"idiosyncrat\" + 0.014*\"maria\" + 0.013*\"order\" + 0.012*\"count\"\n", + "2019-01-31 00:29:33,745 : INFO : topic #45 (0.020): 0.017*\"fifteenth\" + 0.017*\"jpg\" + 0.016*\"black\" + 0.015*\"western\" + 0.015*\"illicit\" + 0.015*\"colder\" + 0.014*\"record\" + 0.009*\"blind\" + 0.007*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:29:33,746 : INFO : topic #34 (0.020): 0.077*\"start\" + 0.036*\"cotton\" + 
0.032*\"unionist\" + 0.027*\"american\" + 0.024*\"new\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"year\" + 0.012*\"north\"\n", + "2019-01-31 00:29:33,747 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.029*\"woman\" + 0.027*\"olymp\" + 0.023*\"men\" + 0.023*\"medal\" + 0.020*\"nation\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.019*\"atheist\"\n", + "2019-01-31 00:29:33,749 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.019*\"aggress\" + 0.017*\"com\" + 0.016*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:29:33,754 : INFO : topic diff=0.009141, rho=0.049814\n", + "2019-01-31 00:29:33,910 : INFO : PROGRESS: pass 0, at document #808000/4922894\n", + "2019-01-31 00:29:35,334 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:35,599 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.019*\"act\" + 0.015*\"ricardo\" + 0.014*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"replac\"\n", + "2019-01-31 00:29:35,600 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.080*\"octob\" + 0.078*\"sens\" + 0.076*\"januari\" + 0.072*\"notion\" + 0.072*\"juli\" + 0.071*\"april\" + 0.071*\"decatur\" + 0.070*\"august\" + 0.069*\"judici\"\n", + "2019-01-31 00:29:35,602 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.022*\"tourist\" + 0.022*\"wife\" + 0.019*\"champion\" + 0.019*\"taxpay\" + 0.016*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"poet\"\n", + "2019-01-31 00:29:35,603 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"vacant\" + 0.008*\"sourc\"\n", + "2019-01-31 00:29:35,604 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.022*\"adulthood\" + 
0.016*\"feel\" + 0.016*\"hostil\" + 0.015*\"male\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.010*\"yawn\" + 0.009*\"genu\"\n", + "2019-01-31 00:29:35,610 : INFO : topic diff=0.008247, rho=0.049752\n", + "2019-01-31 00:29:35,766 : INFO : PROGRESS: pass 0, at document #810000/4922894\n", + "2019-01-31 00:29:37,199 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:29:37,465 : INFO : topic #46 (0.020): 0.021*\"sweden\" + 0.019*\"norwai\" + 0.017*\"swedish\" + 0.017*\"turkish\" + 0.015*\"stop\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.013*\"wind\" + 0.012*\"denmark\" + 0.011*\"turkei\"\n", + "2019-01-31 00:29:37,466 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:29:37,467 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.024*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"linear\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:29:37,468 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"australian\" + 0.021*\"england\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.015*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 00:29:37,469 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"plaisir\" + 0.011*\"live\" + 0.009*\"yawn\" + 0.009*\"genu\"\n", + "2019-01-31 00:29:37,475 : INFO : topic diff=0.007096, rho=0.049690\n", + "2019-01-31 00:29:37,635 : INFO : PROGRESS: pass 0, at document #812000/4922894\n", + "2019-01-31 00:29:39,084 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:39,350 : INFO : 
topic #8 (0.020): 0.028*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.015*\"ricardo\" + 0.014*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.009*\"judaism\" + 0.008*\"replac\"\n", + "2019-01-31 00:29:39,351 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.013*\"class\" + 0.013*\"pope\" + 0.013*\"scot\" + 0.012*\"blur\" + 0.012*\"coalit\" + 0.011*\"nativist\" + 0.009*\"bahá\"\n", + "2019-01-31 00:29:39,353 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.034*\"sovereignti\" + 0.032*\"rural\" + 0.027*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"czech\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:29:39,354 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.022*\"tourist\" + 0.021*\"wife\" + 0.019*\"taxpay\" + 0.019*\"champion\" + 0.017*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 00:29:39,355 : INFO : topic #40 (0.020): 0.091*\"unit\" + 0.025*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"governor\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:29:39,361 : INFO : topic diff=0.009155, rho=0.049629\n", + "2019-01-31 00:29:39,517 : INFO : PROGRESS: pass 0, at document #814000/4922894\n", + "2019-01-31 00:29:40,923 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:41,189 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.066*\"best\" + 0.038*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 00:29:41,191 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.008*\"have\" + 0.008*\"pathwai\" + 0.008*\"disco\" + 0.007*\"caus\" + 0.006*\"hormon\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"activ\"\n", + "2019-01-31 00:29:41,192 : INFO : topic #20 
(0.020): 0.135*\"scholar\" + 0.038*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.020*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"district\" + 0.009*\"class\"\n", + "2019-01-31 00:29:41,193 : INFO : topic #36 (0.020): 0.015*\"companhia\" + 0.011*\"pop\" + 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.007*\"diggin\" + 0.007*\"includ\" + 0.007*\"base\" + 0.007*\"brio\"\n", + "2019-01-31 00:29:41,194 : INFO : topic #39 (0.020): 0.040*\"canada\" + 0.035*\"canadian\" + 0.018*\"toronto\" + 0.017*\"hoar\" + 0.016*\"ontario\" + 0.014*\"taxpay\" + 0.013*\"new\" + 0.013*\"scientist\" + 0.012*\"basketbal\" + 0.011*\"hydrogen\"\n", + "2019-01-31 00:29:41,200 : INFO : topic diff=0.008637, rho=0.049568\n", + "2019-01-31 00:29:41,356 : INFO : PROGRESS: pass 0, at document #816000/4922894\n", + "2019-01-31 00:29:42,786 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:43,052 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.041*\"tortur\" + 0.033*\"area\" + 0.027*\"cotton\" + 0.025*\"regim\" + 0.024*\"multitud\" + 0.021*\"citi\" + 0.021*\"commun\"\n", + "2019-01-31 00:29:43,053 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"john\"\n", + "2019-01-31 00:29:43,055 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.015*\"ricardo\" + 0.014*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.009*\"judaism\" + 0.008*\"replac\"\n", + "2019-01-31 00:29:43,056 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.033*\"canadian\" + 0.018*\"toronto\" + 0.017*\"hoar\" + 0.015*\"ontario\" + 0.014*\"taxpay\" + 0.013*\"new\" + 0.013*\"scientist\" + 0.012*\"basketbal\" + 0.011*\"novotná\"\n", + "2019-01-31 00:29:43,057 : INFO : topic #29 
(0.020): 0.010*\"companhia\" + 0.010*\"million\" + 0.009*\"govern\" + 0.009*\"start\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.007*\"function\" + 0.007*\"countri\" + 0.006*\"market\" + 0.006*\"inconclus\"\n", + "2019-01-31 00:29:43,063 : INFO : topic diff=0.008697, rho=0.049507\n", + "2019-01-31 00:29:43,219 : INFO : PROGRESS: pass 0, at document #818000/4922894\n", + "2019-01-31 00:29:44,654 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:44,921 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.020*\"aggress\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:29:44,922 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"call\"\n", + "2019-01-31 00:29:44,923 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.020*\"dutch\" + 0.019*\"folei\" + 0.018*\"english\" + 0.017*\"player\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:29:44,925 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"damn\" + 0.018*\"compos\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.014*\"physician\" + 0.013*\"jack\"\n", + "2019-01-31 00:29:44,926 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.017*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 00:29:44,932 : INFO : topic diff=0.009332, rho=0.049447\n", + "2019-01-31 00:29:47,647 : INFO : -11.485 per-word bound, 2866.5 perplexity estimate based on a held-out corpus of 2000 documents with 539358 words\n", + "2019-01-31 00:29:47,648 : INFO : PROGRESS: pass 0, at document 
#820000/4922894\n", + "2019-01-31 00:29:49,063 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:49,329 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.005*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"call\"\n", + "2019-01-31 00:29:49,330 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 00:29:49,331 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.033*\"raid\" + 0.030*\"museo\" + 0.021*\"traceabl\" + 0.018*\"serv\" + 0.016*\"pain\" + 0.015*\"exhaust\" + 0.014*\"artist\"\n", + "2019-01-31 00:29:49,332 : INFO : topic #16 (0.020): 0.040*\"king\" + 0.032*\"priest\" + 0.021*\"grammat\" + 0.019*\"duke\" + 0.019*\"quarterli\" + 0.016*\"rotterdam\" + 0.016*\"idiosyncrat\" + 0.014*\"maria\" + 0.013*\"order\" + 0.012*\"portugues\"\n", + "2019-01-31 00:29:49,333 : INFO : topic #23 (0.020): 0.131*\"audit\" + 0.066*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"festiv\" + 0.023*\"japanes\" + 0.022*\"intern\" + 0.022*\"noll\" + 0.019*\"women\" + 0.013*\"prison\"\n", + "2019-01-31 00:29:49,339 : INFO : topic diff=0.007250, rho=0.049386\n", + "2019-01-31 00:29:49,490 : INFO : PROGRESS: pass 0, at document #822000/4922894\n", + "2019-01-31 00:29:50,887 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:51,153 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.026*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.010*\"yawn\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:29:51,154 : INFO : topic #3 (0.020): 
0.036*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.024*\"serv\" + 0.020*\"member\" + 0.019*\"gener\" + 0.018*\"seri\" + 0.018*\"nation\" + 0.017*\"govern\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:29:51,155 : INFO : topic #31 (0.020): 0.063*\"fusiform\" + 0.024*\"scientist\" + 0.023*\"player\" + 0.021*\"taxpay\" + 0.020*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.012*\"yard\" + 0.011*\"folei\" + 0.009*\"barber\"\n", + "2019-01-31 00:29:51,157 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.010*\"battalion\" + 0.010*\"king\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.008*\"centuri\" + 0.007*\"armi\" + 0.007*\"embassi\" + 0.007*\"teufel\"\n", + "2019-01-31 00:29:51,158 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:29:51,164 : INFO : topic diff=0.008012, rho=0.049326\n", + "2019-01-31 00:29:51,322 : INFO : PROGRESS: pass 0, at document #824000/4922894\n", + "2019-01-31 00:29:52,753 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:53,019 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:29:53,020 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.023*\"serv\" + 0.020*\"member\" + 0.018*\"gener\" + 0.018*\"seri\" + 0.018*\"nation\" + 0.017*\"govern\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:29:53,022 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"candid\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.011*\"landslid\" + 0.011*\"théori\"\n", + "2019-01-31 00:29:53,023 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 
0.024*\"voluntari\" + 0.022*\"democrat\" + 0.022*\"member\" + 0.018*\"polici\" + 0.015*\"liber\" + 0.014*\"report\" + 0.014*\"conserv\" + 0.014*\"republ\"\n", + "2019-01-31 00:29:53,024 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.034*\"cotton\" + 0.032*\"unionist\" + 0.026*\"american\" + 0.024*\"new\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"year\" + 0.012*\"north\"\n", + "2019-01-31 00:29:53,030 : INFO : topic diff=0.008492, rho=0.049266\n", + "2019-01-31 00:29:53,189 : INFO : PROGRESS: pass 0, at document #826000/4922894\n", + "2019-01-31 00:29:54,622 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:54,888 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.013*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.012*\"coalit\" + 0.012*\"class\" + 0.011*\"nativist\" + 0.009*\"fleet\"\n", + "2019-01-31 00:29:54,889 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"rosenwald\" + 0.010*\"linear\"\n", + "2019-01-31 00:29:54,890 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.056*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.018*\"polici\" + 0.015*\"liber\" + 0.014*\"conserv\" + 0.014*\"report\" + 0.014*\"republ\"\n", + "2019-01-31 00:29:54,891 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"centuri\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"english\"\n", + "2019-01-31 00:29:54,892 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.015*\"ricardo\" + 0.014*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"judaism\" + 0.008*\"replac\"\n", + "2019-01-31 00:29:54,898 : INFO : topic diff=0.006894, rho=0.049207\n", + "2019-01-31 
00:29:55,054 : INFO : PROGRESS: pass 0, at document #828000/4922894\n", + "2019-01-31 00:29:56,457 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:56,723 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:29:56,724 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.023*\"serv\" + 0.020*\"member\" + 0.018*\"gener\" + 0.018*\"seri\" + 0.018*\"nation\" + 0.017*\"govern\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:29:56,725 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.016*\"physician\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:29:56,726 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"student\" + 0.007*\"human\"\n", + "2019-01-31 00:29:56,727 : INFO : topic #20 (0.020): 0.135*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 00:29:56,733 : INFO : topic diff=0.010578, rho=0.049147\n", + "2019-01-31 00:29:56,886 : INFO : PROGRESS: pass 0, at document #830000/4922894\n", + "2019-01-31 00:29:58,289 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:29:58,556 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.028*\"offic\" + 0.027*\"minist\" + 0.023*\"serv\" + 0.020*\"member\" + 0.018*\"gener\" + 0.018*\"seri\" + 0.018*\"nation\" + 0.018*\"govern\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:29:58,557 : INFO : topic #46 (0.020): 0.020*\"sweden\" + 
0.017*\"norwai\" + 0.017*\"swedish\" + 0.017*\"turkish\" + 0.017*\"stop\" + 0.015*\"damag\" + 0.014*\"norwegian\" + 0.012*\"wind\" + 0.012*\"turkei\" + 0.012*\"denmark\"\n", + "2019-01-31 00:29:58,558 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.030*\"champion\" + 0.029*\"workplac\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.021*\"event\" + 0.020*\"rainfal\" + 0.019*\"atheist\" + 0.019*\"nation\"\n", + "2019-01-31 00:29:58,559 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.009*\"produc\" + 0.008*\"candid\" + 0.008*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:29:58,560 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"mexican\"\n", + "2019-01-31 00:29:58,566 : INFO : topic diff=0.007455, rho=0.049088\n", + "2019-01-31 00:29:58,785 : INFO : PROGRESS: pass 0, at document #832000/4922894\n", + "2019-01-31 00:30:00,196 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:00,462 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.019*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"sourc\" + 0.008*\"land\"\n", + "2019-01-31 00:30:00,464 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.008*\"have\" + 0.008*\"pathwai\" + 0.008*\"disco\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 00:30:00,465 : INFO : topic #42 (0.020): 0.042*\"german\" + 0.029*\"germani\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.013*\"der\" + 0.013*\"israel\" + 0.013*\"berlin\" + 0.010*\"itali\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 00:30:00,466 : INFO : topic #20 (0.020): 0.135*\"scholar\" + 0.038*\"struggl\" 
+ 0.032*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.009*\"class\"\n", + "2019-01-31 00:30:00,467 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.033*\"canadian\" + 0.017*\"toronto\" + 0.017*\"hoar\" + 0.015*\"ontario\" + 0.014*\"taxpay\" + 0.013*\"new\" + 0.013*\"scientist\" + 0.012*\"basketbal\" + 0.011*\"misericordia\"\n", + "2019-01-31 00:30:00,473 : INFO : topic diff=0.008851, rho=0.049029\n", + "2019-01-31 00:30:00,625 : INFO : PROGRESS: pass 0, at document #834000/4922894\n", + "2019-01-31 00:30:02,008 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:02,275 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:30:02,276 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.024*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"governor\" + 0.012*\"word\" + 0.011*\"http\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:30:02,277 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"rhyme\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"paul\"\n", + "2019-01-31 00:30:02,278 : INFO : topic #45 (0.020): 0.018*\"fifteenth\" + 0.018*\"jpg\" + 0.015*\"black\" + 0.015*\"western\" + 0.014*\"colder\" + 0.014*\"illicit\" + 0.013*\"record\" + 0.009*\"blind\" + 0.008*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:30:02,280 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.011*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 
00:30:02,285 : INFO : topic diff=0.007856, rho=0.048970\n", + "2019-01-31 00:30:02,443 : INFO : PROGRESS: pass 0, at document #836000/4922894\n", + "2019-01-31 00:30:03,873 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:04,140 : INFO : topic #29 (0.020): 0.010*\"companhia\" + 0.010*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.009*\"start\" + 0.008*\"bank\" + 0.007*\"function\" + 0.007*\"countri\" + 0.006*\"market\" + 0.006*\"industri\"\n", + "2019-01-31 00:30:04,141 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.018*\"stop\" + 0.017*\"norwai\" + 0.017*\"swedish\" + 0.015*\"turkish\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.013*\"treeless\" + 0.012*\"huntsvil\"\n", + "2019-01-31 00:30:04,142 : INFO : topic #26 (0.020): 0.031*\"woman\" + 0.029*\"champion\" + 0.028*\"workplac\" + 0.026*\"men\" + 0.026*\"olymp\" + 0.022*\"medal\" + 0.021*\"event\" + 0.020*\"rainfal\" + 0.020*\"atheist\" + 0.020*\"nation\"\n", + "2019-01-31 00:30:04,143 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.035*\"sovereignti\" + 0.032*\"rural\" + 0.027*\"reprint\" + 0.023*\"poison\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.018*\"turin\" + 0.015*\"poland\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:30:04,145 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"deal\"\n", + "2019-01-31 00:30:04,150 : INFO : topic diff=0.007664, rho=0.048912\n", + "2019-01-31 00:30:04,305 : INFO : PROGRESS: pass 0, at document #838000/4922894\n", + "2019-01-31 00:30:05,698 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:05,964 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.012*\"coalit\" + 0.011*\"nativist\" + 0.011*\"class\" + 0.009*\"fleet\"\n", 
+ "2019-01-31 00:30:05,965 : INFO : topic #29 (0.020): 0.011*\"companhia\" + 0.010*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.009*\"start\" + 0.008*\"bank\" + 0.007*\"function\" + 0.007*\"countri\" + 0.006*\"market\" + 0.006*\"industri\"\n", + "2019-01-31 00:30:05,966 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.040*\"line\" + 0.037*\"raid\" + 0.036*\"arsen\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:30:05,967 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.015*\"hostil\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:30:05,969 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.016*\"year\" + 0.015*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.008*\"hot\"\n", + "2019-01-31 00:30:05,974 : INFO : topic diff=0.008260, rho=0.048853\n", + "2019-01-31 00:30:08,653 : INFO : -11.748 per-word bound, 3439.5 perplexity estimate based on a held-out corpus of 2000 documents with 526338 words\n", + "2019-01-31 00:30:08,653 : INFO : PROGRESS: pass 0, at document #840000/4922894\n", + "2019-01-31 00:30:10,046 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:10,312 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:30:10,313 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:30:10,314 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 
0.029*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 00:30:10,315 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:30:10,317 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.016*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:30:10,322 : INFO : topic diff=0.008498, rho=0.048795\n", + "2019-01-31 00:30:10,477 : INFO : PROGRESS: pass 0, at document #842000/4922894\n", + "2019-01-31 00:30:11,889 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:12,155 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:30:12,156 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.016*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"word\"\n", + "2019-01-31 00:30:12,157 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"man\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"deal\"\n", + "2019-01-31 00:30:12,158 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:30:12,159 : INFO : topic #16 (0.020): 0.040*\"king\" + 0.035*\"priest\" + 0.021*\"quarterli\" + 
0.019*\"duke\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.014*\"maria\" + 0.013*\"princ\" + 0.012*\"brazil\"\n", + "2019-01-31 00:30:12,165 : INFO : topic diff=0.008895, rho=0.048737\n", + "2019-01-31 00:30:12,319 : INFO : PROGRESS: pass 0, at document #844000/4922894\n", + "2019-01-31 00:30:13,676 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:13,945 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.034*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"reprint\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.017*\"turin\" + 0.016*\"poland\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:30:13,946 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"student\" + 0.007*\"socialist\"\n", + "2019-01-31 00:30:13,947 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.017*\"seaport\" + 0.016*\"republ\" + 0.015*\"liber\" + 0.014*\"bypass\"\n", + "2019-01-31 00:30:13,948 : INFO : topic #16 (0.020): 0.040*\"king\" + 0.035*\"priest\" + 0.021*\"quarterli\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.014*\"maria\" + 0.013*\"princ\" + 0.012*\"brazil\"\n", + "2019-01-31 00:30:13,949 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.017*\"place\" + 0.017*\"damn\" + 0.016*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"word\"\n", + "2019-01-31 00:30:13,955 : INFO : topic diff=0.008711, rho=0.048679\n", + "2019-01-31 00:30:14,109 : INFO : PROGRESS: pass 0, at document #846000/4922894\n", + "2019-01-31 00:30:15,509 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:15,775 : INFO : topic #21 (0.020): 
0.035*\"samford\" + 0.023*\"spain\" + 0.020*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"mexican\" + 0.011*\"carlo\" + 0.011*\"juan\"\n", + "2019-01-31 00:30:15,776 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:30:15,777 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.009*\"produc\" + 0.008*\"candid\" + 0.008*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:30:15,778 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.037*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:30:15,779 : INFO : topic #29 (0.020): 0.011*\"companhia\" + 0.010*\"million\" + 0.009*\"govern\" + 0.009*\"yawn\" + 0.009*\"start\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.006*\"market\" + 0.006*\"industri\"\n", + "2019-01-31 00:30:15,785 : INFO : topic diff=0.008453, rho=0.048622\n", + "2019-01-31 00:30:15,940 : INFO : PROGRESS: pass 0, at document #848000/4922894\n", + "2019-01-31 00:30:17,370 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:17,636 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"reprint\" + 0.026*\"personifi\" + 0.025*\"poison\" + 0.020*\"moscow\" + 0.016*\"turin\" + 0.015*\"poland\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:30:17,637 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"pathwai\" + 0.007*\"caus\" + 0.006*\"hormon\" + 0.006*\"treat\" + 0.006*\"effect\" + 
0.006*\"proper\"\n", + "2019-01-31 00:30:17,638 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:30:17,640 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.009*\"produc\" + 0.008*\"candid\" + 0.008*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:30:17,641 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.024*\"scientist\" + 0.023*\"player\" + 0.021*\"taxpay\" + 0.020*\"place\" + 0.012*\"clot\" + 0.012*\"leagu\" + 0.011*\"yard\" + 0.011*\"folei\" + 0.009*\"yawn\"\n", + "2019-01-31 00:30:17,647 : INFO : topic diff=0.007210, rho=0.048564\n", + "2019-01-31 00:30:17,803 : INFO : PROGRESS: pass 0, at document #850000/4922894\n", + "2019-01-31 00:30:19,205 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:19,472 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.031*\"area\" + 0.026*\"regim\" + 0.025*\"cotton\" + 0.025*\"multitud\" + 0.022*\"citi\" + 0.021*\"commun\"\n", + "2019-01-31 00:30:19,473 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.036*\"yawn\" + 0.027*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.022*\"festiv\" + 0.022*\"intern\" + 0.019*\"women\" + 0.015*\"prison\"\n", + "2019-01-31 00:30:19,474 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"litig\" + 0.004*\"vision\" + 0.003*\"amphora\" + 0.003*\"black\"\n", + "2019-01-31 00:30:19,475 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"class\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.008*\"fleet\"\n", + 
"2019-01-31 00:30:19,476 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"rel\" + 0.028*\"son\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:30:19,482 : INFO : topic diff=0.013095, rho=0.048507\n", + "2019-01-31 00:30:19,630 : INFO : PROGRESS: pass 0, at document #852000/4922894\n", + "2019-01-31 00:30:21,009 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:21,276 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.014*\"ricardo\" + 0.014*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"replac\" + 0.008*\"princess\"\n", + "2019-01-31 00:30:21,277 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"student\" + 0.007*\"human\"\n", + "2019-01-31 00:30:21,278 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"australia\" + 0.024*\"australian\" + 0.024*\"new\" + 0.024*\"london\" + 0.020*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:30:21,279 : INFO : topic #45 (0.020): 0.020*\"jpg\" + 0.019*\"fifteenth\" + 0.015*\"black\" + 0.014*\"illicit\" + 0.014*\"western\" + 0.014*\"colder\" + 0.012*\"record\" + 0.009*\"blind\" + 0.008*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:30:21,280 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.039*\"line\" + 0.039*\"arsen\" + 0.036*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:30:21,286 : INFO : topic diff=0.008795, rho=0.048450\n", + "2019-01-31 00:30:21,445 : INFO : PROGRESS: pass 0, at document #854000/4922894\n", + "2019-01-31 00:30:22,849 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:30:23,116 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.024*\"london\" + 0.024*\"new\" + 0.024*\"australian\" + 0.020*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:30:23,117 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:30:23,118 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.025*\"personifi\" + 0.022*\"moscow\" + 0.016*\"turin\" + 0.016*\"poland\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:30:23,119 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"televis\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.011*\"khalsa\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"start\" + 0.009*\"alam\"\n", + "2019-01-31 00:30:23,120 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.039*\"arsen\" + 0.039*\"line\" + 0.036*\"raid\" + 0.029*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.014*\"artist\"\n", + "2019-01-31 00:30:23,126 : INFO : topic diff=0.007686, rho=0.048393\n", + "2019-01-31 00:30:23,283 : INFO : PROGRESS: pass 0, at document #856000/4922894\n", + "2019-01-31 00:30:24,709 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:24,975 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.019*\"folei\" + 0.018*\"player\" + 0.017*\"english\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:30:24,976 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.046*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.017*\"sourc\" + 0.013*\"kim\" + 0.012*\"taiwan\"\n", + 
"2019-01-31 00:30:24,977 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"class\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"fleet\"\n", + "2019-01-31 00:30:24,978 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"collector\" + 0.022*\"schuster\" + 0.020*\"institut\" + 0.019*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:30:24,979 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.048*\"franc\" + 0.033*\"pari\" + 0.026*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:30:24,985 : INFO : topic diff=0.007652, rho=0.048337\n", + "2019-01-31 00:30:25,140 : INFO : PROGRESS: pass 0, at document #858000/4922894\n", + "2019-01-31 00:30:26,534 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:26,800 : INFO : topic #46 (0.020): 0.020*\"sweden\" + 0.018*\"stop\" + 0.018*\"norwai\" + 0.018*\"swedish\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.014*\"turkish\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.012*\"huntsvil\"\n", + "2019-01-31 00:30:26,802 : INFO : topic #42 (0.020): 0.041*\"german\" + 0.029*\"germani\" + 0.013*\"israel\" + 0.013*\"jewish\" + 0.013*\"vol\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.010*\"austria\" + 0.009*\"itali\" + 0.008*\"european\"\n", + "2019-01-31 00:30:26,803 : INFO : topic #39 (0.020): 0.038*\"canada\" + 0.035*\"canadian\" + 0.019*\"toronto\" + 0.017*\"hoar\" + 0.015*\"ontario\" + 0.013*\"new\" + 0.013*\"taxpay\" + 0.013*\"scientist\" + 0.012*\"basketbal\" + 0.011*\"hydrogen\"\n", + "2019-01-31 00:30:26,804 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"centuri\" + 0.007*\"charact\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"god\"\n" + ] + }, + { + 
"name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:30:26,805 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"class\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.008*\"fleet\"\n", + "2019-01-31 00:30:26,811 : INFO : topic diff=0.007951, rho=0.048280\n", + "2019-01-31 00:30:29,563 : INFO : -11.691 per-word bound, 3306.6 perplexity estimate based on a held-out corpus of 2000 documents with 552096 words\n", + "2019-01-31 00:30:29,563 : INFO : PROGRESS: pass 0, at document #860000/4922894\n", + "2019-01-31 00:30:31,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:31,411 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"battalion\" + 0.009*\"king\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.008*\"centuri\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"embassi\"\n", + "2019-01-31 00:30:31,412 : INFO : topic #36 (0.020): 0.013*\"companhia\" + 0.011*\"pop\" + 0.010*\"network\" + 0.010*\"prognosi\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.008*\"base\" + 0.008*\"includ\" + 0.007*\"brio\" + 0.007*\"diggin\"\n", + "2019-01-31 00:30:31,414 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.008*\"cultur\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:30:31,415 : INFO : topic #46 (0.020): 0.020*\"sweden\" + 0.018*\"stop\" + 0.018*\"norwai\" + 0.017*\"swedish\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.014*\"turkish\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.012*\"huntsvil\"\n", + "2019-01-31 00:30:31,416 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:30:31,422 : INFO : topic diff=0.007213, 
rho=0.048224\n", + "2019-01-31 00:30:31,633 : INFO : PROGRESS: pass 0, at document #862000/4922894\n", + "2019-01-31 00:30:33,042 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:33,309 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:30:33,310 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.030*\"workplac\" + 0.029*\"champion\" + 0.028*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.019*\"atheist\"\n", + "2019-01-31 00:30:33,312 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.014*\"ricardo\" + 0.014*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.009*\"replac\" + 0.008*\"judaism\"\n", + "2019-01-31 00:30:33,313 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.026*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.015*\"hostil\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.011*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:30:33,314 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.030*\"offic\" + 0.025*\"minist\" + 0.021*\"serv\" + 0.019*\"member\" + 0.018*\"gener\" + 0.017*\"govern\" + 0.017*\"seri\" + 0.017*\"nation\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:30:33,320 : INFO : topic diff=0.008605, rho=0.048168\n", + "2019-01-31 00:30:33,477 : INFO : PROGRESS: pass 0, at document #864000/4922894\n", + "2019-01-31 00:30:34,844 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:35,114 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"pathwai\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:30:35,115 : INFO : topic #5 (0.020): 
0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:30:35,116 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.024*\"australian\" + 0.024*\"new\" + 0.024*\"london\" + 0.020*\"british\" + 0.020*\"england\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:30:35,117 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.032*\"new\" + 0.021*\"palmer\" + 0.016*\"year\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:30:35,118 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:30:35,124 : INFO : topic diff=0.008393, rho=0.048113\n", + "2019-01-31 00:30:35,281 : INFO : PROGRESS: pass 0, at document #866000/4922894\n", + "2019-01-31 00:30:36,699 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:36,965 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.025*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.013*\"diversifi\"\n", + "2019-01-31 00:30:36,966 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.009*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:30:36,968 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"candid\" + 0.013*\"fool\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.011*\"landslid\" + 0.011*\"théori\"\n", + "2019-01-31 00:30:36,969 : INFO : topic #15 (0.020): 
0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"word\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:30:36,970 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.031*\"new\" + 0.021*\"palmer\" + 0.016*\"year\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:30:36,976 : INFO : topic diff=0.008114, rho=0.048057\n", + "2019-01-31 00:30:37,130 : INFO : PROGRESS: pass 0, at document #868000/4922894\n", + "2019-01-31 00:30:38,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:38,808 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.009*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:30:38,809 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.036*\"canadian\" + 0.019*\"hoar\" + 0.018*\"toronto\" + 0.015*\"ontario\" + 0.013*\"new\" + 0.013*\"taxpay\" + 0.012*\"scientist\" + 0.012*\"hydrogen\" + 0.012*\"basketbal\"\n", + "2019-01-31 00:30:38,810 : INFO : topic #36 (0.020): 0.013*\"companhia\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.010*\"network\" + 0.010*\"develop\" + 0.008*\"serv\" + 0.008*\"base\" + 0.008*\"includ\" + 0.007*\"user\" + 0.007*\"brio\"\n", + "2019-01-31 00:30:38,812 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:30:38,813 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.068*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.022*\"noll\" + 0.020*\"intern\" + 0.019*\"women\" + 0.014*\"prison\"\n", + "2019-01-31 00:30:38,819 : INFO : topic diff=0.007517, rho=0.048002\n", + 
"2019-01-31 00:30:38,978 : INFO : PROGRESS: pass 0, at document #870000/4922894\n", + "2019-01-31 00:30:40,407 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:40,673 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.046*\"chilton\" + 0.028*\"kong\" + 0.027*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.018*\"leah\" + 0.016*\"sourc\" + 0.013*\"kim\" + 0.011*\"taiwan\"\n", + "2019-01-31 00:30:40,674 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"battalion\" + 0.009*\"aza\" + 0.009*\"king\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.008*\"centuri\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.006*\"till\"\n", + "2019-01-31 00:30:40,675 : INFO : topic #31 (0.020): 0.063*\"fusiform\" + 0.025*\"scientist\" + 0.023*\"player\" + 0.021*\"taxpay\" + 0.020*\"place\" + 0.012*\"clot\" + 0.012*\"leagu\" + 0.011*\"yard\" + 0.010*\"folei\" + 0.010*\"ruler\"\n", + "2019-01-31 00:30:40,677 : INFO : topic #39 (0.020): 0.039*\"canada\" + 0.036*\"canadian\" + 0.020*\"hoar\" + 0.018*\"toronto\" + 0.014*\"ontario\" + 0.013*\"taxpay\" + 0.013*\"new\" + 0.012*\"hydrogen\" + 0.012*\"scientist\" + 0.012*\"basketbal\"\n", + "2019-01-31 00:30:40,678 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:30:40,684 : INFO : topic diff=0.008654, rho=0.047946\n", + "2019-01-31 00:30:40,843 : INFO : PROGRESS: pass 0, at document #872000/4922894\n", + "2019-01-31 00:30:42,276 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:42,546 : INFO : topic #18 (0.020): 0.009*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.007*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"man\" + 0.004*\"deal\" + 0.004*\"end\"\n", + "2019-01-31 
00:30:42,547 : INFO : topic #26 (0.020): 0.030*\"alic\" + 0.029*\"workplac\" + 0.029*\"woman\" + 0.029*\"champion\" + 0.027*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.022*\"left\" + 0.020*\"event\" + 0.018*\"rainfal\"\n", + "2019-01-31 00:30:42,548 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.046*\"chilton\" + 0.027*\"kong\" + 0.026*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.018*\"leah\" + 0.016*\"sourc\" + 0.013*\"kim\" + 0.011*\"taiwan\"\n", + "2019-01-31 00:30:42,549 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.018*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:30:42,551 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.008*\"gestur\" + 0.008*\"man\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"vision\" + 0.004*\"black\" + 0.003*\"admit\"\n", + "2019-01-31 00:30:42,557 : INFO : topic diff=0.008624, rho=0.047891\n", + "2019-01-31 00:30:42,714 : INFO : PROGRESS: pass 0, at document #874000/4922894\n", + "2019-01-31 00:30:44,116 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:44,383 : INFO : topic #29 (0.020): 0.012*\"companhia\" + 0.010*\"million\" + 0.009*\"yawn\" + 0.008*\"govern\" + 0.008*\"start\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.007*\"market\" + 0.006*\"busi\"\n", + "2019-01-31 00:30:44,384 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.012*\"berlin\" + 0.010*\"austria\" + 0.009*\"itali\" + 0.008*\"europ\"\n", + "2019-01-31 00:30:44,386 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.028*\"final\" + 0.024*\"tourist\" + 0.020*\"wife\" + 0.020*\"champion\" + 0.018*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:30:44,387 : INFO : topic #10 
(0.020): 0.010*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:30:44,388 : INFO : topic #11 (0.020): 0.029*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.009*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:30:44,394 : INFO : topic diff=0.008442, rho=0.047836\n", + "2019-01-31 00:30:44,547 : INFO : PROGRESS: pass 0, at document #876000/4922894\n", + "2019-01-31 00:30:45,948 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:46,214 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.057*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"seaport\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 00:30:46,216 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.018*\"lagrang\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"land\" + 0.008*\"foam\" + 0.008*\"vacant\"\n", + "2019-01-31 00:30:46,217 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"collector\" + 0.022*\"schuster\" + 0.021*\"institut\" + 0.019*\"requir\" + 0.018*\"student\" + 0.017*\"professor\" + 0.012*\"governor\" + 0.012*\"word\" + 0.011*\"http\"\n", + "2019-01-31 00:30:46,219 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.050*\"franc\" + 0.032*\"pari\" + 0.027*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:30:46,220 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.020*\"member\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.018*\"govern\" + 0.017*\"seri\" + 0.017*\"nation\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:30:46,226 : INFO : topic diff=0.008555, rho=0.047782\n", + 
"2019-01-31 00:30:46,390 : INFO : PROGRESS: pass 0, at document #878000/4922894\n", + "2019-01-31 00:30:47,802 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:48,068 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.014*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:30:48,069 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.028*\"alic\" + 0.028*\"woman\" + 0.027*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.021*\"left\" + 0.020*\"event\" + 0.018*\"atheist\"\n", + "2019-01-31 00:30:48,071 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.047*\"american\" + 0.025*\"valour\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.016*\"polit\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:30:48,072 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"poet\" + 0.006*\"differ\"\n", + "2019-01-31 00:30:48,074 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.015*\"year\" + 0.015*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:30:48,079 : INFO : topic diff=0.007568, rho=0.047727\n", + "2019-01-31 00:30:50,743 : INFO : -11.666 per-word bound, 3249.4 perplexity estimate based on a held-out corpus of 2000 documents with 523385 words\n", + "2019-01-31 00:30:50,743 : INFO : PROGRESS: pass 0, at document #880000/4922894\n", + "2019-01-31 00:30:52,132 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:52,398 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"televis\" + 
0.011*\"khalsa\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"start\" + 0.010*\"affection\"\n", + "2019-01-31 00:30:52,399 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.030*\"area\" + 0.026*\"regim\" + 0.025*\"cotton\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:30:52,400 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.009*\"depress\"\n", + "2019-01-31 00:30:52,401 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.012*\"berlin\" + 0.012*\"israel\" + 0.010*\"austria\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:30:52,403 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.015*\"year\" + 0.015*\"center\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:30:52,409 : INFO : topic diff=0.007326, rho=0.047673\n", + "2019-01-31 00:30:52,565 : INFO : PROGRESS: pass 0, at document #882000/4922894\n", + "2019-01-31 00:30:53,987 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:54,254 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.018*\"candid\" + 0.018*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"find\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.011*\"landslid\" + 0.011*\"théori\" + 0.010*\"ret\"\n", + "2019-01-31 00:30:54,255 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.014*\"hostil\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:30:54,257 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"produc\" + 0.009*\"mode\" + 
0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:30:54,258 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.012*\"israel\" + 0.010*\"austria\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:30:54,259 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"centuri\" + 0.007*\"trade\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.007*\"god\"\n", + "2019-01-31 00:30:54,265 : INFO : topic diff=0.008168, rho=0.047619\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:30:54,425 : INFO : PROGRESS: pass 0, at document #884000/4922894\n", + "2019-01-31 00:30:55,869 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:56,136 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"arsen\" + 0.039*\"line\" + 0.033*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.017*\"pain\" + 0.015*\"artist\" + 0.015*\"exhaust\"\n", + "2019-01-31 00:30:56,137 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.024*\"minist\" + 0.020*\"member\" + 0.019*\"serv\" + 0.018*\"govern\" + 0.018*\"gener\" + 0.018*\"seri\" + 0.017*\"nation\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:30:56,138 : INFO : topic #17 (0.020): 0.070*\"church\" + 0.021*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 0.017*\"sail\" + 0.015*\"cathedr\" + 0.014*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"italian\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:30:56,139 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.013*\"storag\" + 0.013*\"nicola\" + 0.012*\"magazin\" + 0.012*\"worldwid\"\n", + "2019-01-31 00:30:56,140 : INFO : topic #35 (0.020): 0.059*\"russia\" + 
0.036*\"sovereignti\" + 0.036*\"rural\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:30:56,146 : INFO : topic diff=0.007349, rho=0.047565\n", + "2019-01-31 00:30:56,306 : INFO : PROGRESS: pass 0, at document #886000/4922894\n", + "2019-01-31 00:30:57,852 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:30:58,118 : INFO : topic #16 (0.020): 0.041*\"king\" + 0.030*\"priest\" + 0.021*\"grammat\" + 0.021*\"quarterli\" + 0.018*\"duke\" + 0.016*\"rotterdam\" + 0.015*\"maria\" + 0.015*\"idiosyncrat\" + 0.014*\"order\" + 0.014*\"brazil\"\n", + "2019-01-31 00:30:58,119 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:30:58,120 : INFO : topic #17 (0.020): 0.070*\"church\" + 0.021*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.014*\"cathedr\" + 0.010*\"centuri\" + 0.010*\"italian\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:30:58,121 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.057*\"parti\" + 0.027*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.018*\"polici\" + 0.017*\"republ\" + 0.015*\"seaport\" + 0.014*\"liber\" + 0.014*\"report\"\n", + "2019-01-31 00:30:58,123 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.014*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.009*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:30:58,129 : INFO : topic diff=0.009032, rho=0.047511\n", + "2019-01-31 00:30:58,283 : INFO : PROGRESS: pass 0, at document #888000/4922894\n", + "2019-01-31 00:30:59,906 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:31:00,173 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.014*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:31:00,174 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.048*\"american\" + 0.025*\"valour\" + 0.019*\"dutch\" + 0.019*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:31:00,176 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.016*\"year\" + 0.016*\"strategist\" + 0.015*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:31:00,177 : INFO : topic #16 (0.020): 0.041*\"king\" + 0.030*\"priest\" + 0.022*\"quarterli\" + 0.021*\"grammat\" + 0.018*\"duke\" + 0.016*\"rotterdam\" + 0.015*\"maria\" + 0.014*\"idiosyncrat\" + 0.014*\"order\" + 0.013*\"brazil\"\n", + "2019-01-31 00:31:00,178 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.032*\"cotton\" + 0.029*\"unionist\" + 0.027*\"american\" + 0.025*\"new\" + 0.014*\"california\" + 0.014*\"terri\" + 0.013*\"year\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:31:00,184 : INFO : topic diff=0.008016, rho=0.047458\n", + "2019-01-31 00:31:00,337 : INFO : PROGRESS: pass 0, at document #890000/4922894\n", + "2019-01-31 00:31:01,721 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:01,988 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.025*\"scientist\" + 0.023*\"player\" + 0.021*\"taxpay\" + 0.020*\"place\" + 0.013*\"clot\" + 0.011*\"leagu\" + 0.011*\"folei\" + 0.010*\"yard\" + 0.009*\"yawn\"\n", + "2019-01-31 00:31:01,989 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.026*\"new\" + 0.026*\"london\" + 0.024*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n", + 
"2019-01-31 00:31:01,990 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.013*\"nicola\" + 0.013*\"storag\" + 0.012*\"worldwid\" + 0.012*\"magazin\"\n", + "2019-01-31 00:31:01,991 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"word\"\n", + "2019-01-31 00:31:01,992 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:31:01,999 : INFO : topic diff=0.008166, rho=0.047405\n", + "2019-01-31 00:31:02,160 : INFO : PROGRESS: pass 0, at document #892000/4922894\n", + "2019-01-31 00:31:03,567 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:03,837 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.009*\"depress\"\n", + "2019-01-31 00:31:03,838 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.057*\"parti\" + 0.026*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.018*\"polici\" + 0.017*\"republ\" + 0.014*\"report\" + 0.014*\"liber\" + 0.014*\"seaport\"\n", + "2019-01-31 00:31:03,839 : INFO : topic #44 (0.020): 0.029*\"final\" + 0.029*\"rooftop\" + 0.022*\"tourist\" + 0.022*\"wife\" + 0.020*\"champion\" + 0.018*\"taxpay\" + 0.016*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:31:03,840 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.014*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 
0.010*\"acrimoni\"\n", + "2019-01-31 00:31:03,841 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.041*\"tortur\" + 0.030*\"area\" + 0.026*\"regim\" + 0.025*\"cotton\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:31:03,847 : INFO : topic diff=0.009180, rho=0.047351\n", + "2019-01-31 00:31:04,004 : INFO : PROGRESS: pass 0, at document #894000/4922894\n", + "2019-01-31 00:31:05,426 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:05,693 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.020*\"institut\" + 0.019*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:31:05,694 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.028*\"alic\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.023*\"medal\" + 0.023*\"left\" + 0.020*\"event\" + 0.018*\"atheist\"\n", + "2019-01-31 00:31:05,695 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.009*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:31:05,696 : INFO : topic #36 (0.020): 0.012*\"companhia\" + 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.009*\"develop\" + 0.008*\"brio\" + 0.008*\"serv\" + 0.008*\"base\" + 0.008*\"includ\" + 0.008*\"softwar\"\n", + "2019-01-31 00:31:05,697 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.041*\"arsen\" + 0.038*\"line\" + 0.033*\"raid\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.016*\"pain\" + 0.014*\"exhaust\" + 0.014*\"artist\"\n", + "2019-01-31 00:31:05,703 : INFO : topic diff=0.008095, rho=0.047298\n", + "2019-01-31 00:31:05,914 : INFO : PROGRESS: pass 0, at document #896000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + 
"2019-01-31 00:31:07,318 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:07,585 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.021*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:31:07,586 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"new\" + 0.026*\"australia\" + 0.026*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:31:07,587 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"hormon\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:31:07,588 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:31:07,589 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.022*\"collector\" + 0.022*\"schuster\" + 0.020*\"institut\" + 0.019*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:31:07,595 : INFO : topic diff=0.008053, rho=0.047246\n", + "2019-01-31 00:31:07,754 : INFO : PROGRESS: pass 0, at document #898000/4922894\n", + "2019-01-31 00:31:09,168 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:09,434 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.013*\"storag\" + 0.012*\"worldwid\" + 0.011*\"collect\"\n", + "2019-01-31 00:31:09,435 : INFO : topic #45 (0.020): 0.019*\"jpg\" + 0.019*\"fifteenth\" + 0.015*\"black\" + 0.014*\"western\" + 0.014*\"colder\" + 
0.013*\"illicit\" + 0.013*\"record\" + 0.009*\"blind\" + 0.008*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:31:09,437 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:31:09,438 : INFO : topic #17 (0.020): 0.071*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.012*\"cathedr\" + 0.010*\"italian\" + 0.010*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:31:09,439 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:31:09,445 : INFO : topic diff=0.008844, rho=0.047193\n", + "2019-01-31 00:31:12,255 : INFO : -11.820 per-word bound, 3614.7 perplexity estimate based on a held-out corpus of 2000 documents with 591241 words\n", + "2019-01-31 00:31:12,255 : INFO : PROGRESS: pass 0, at document #900000/4922894\n", + "2019-01-31 00:31:13,705 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:13,971 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.028*\"germani\" + 0.014*\"vol\" + 0.014*\"austria\" + 0.013*\"jewish\" + 0.013*\"israel\" + 0.012*\"berlin\" + 0.012*\"der\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:31:13,972 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"class\" + 0.010*\"nativist\" + 0.009*\"vernon\"\n", + "2019-01-31 00:31:13,974 : INFO : topic #29 (0.020): 0.014*\"companhia\" + 0.010*\"million\" + 0.009*\"yawn\" + 0.008*\"govern\" + 0.008*\"start\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.007*\"busi\" + 
0.007*\"market\"\n", + "2019-01-31 00:31:13,975 : INFO : topic #17 (0.020): 0.071*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.012*\"cathedr\" + 0.010*\"italian\" + 0.010*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:31:13,976 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.048*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:31:13,982 : INFO : topic diff=0.008991, rho=0.047140\n", + "2019-01-31 00:31:14,141 : INFO : PROGRESS: pass 0, at document #902000/4922894\n", + "2019-01-31 00:31:15,567 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:15,834 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"servitud\"\n", + "2019-01-31 00:31:15,835 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.011*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:31:15,836 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.010*\"battalion\" + 0.009*\"aza\" + 0.009*\"king\" + 0.008*\"forc\" + 0.008*\"centuri\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"till\"\n", + "2019-01-31 00:31:15,837 : INFO : topic #37 (0.020): 0.011*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.005*\"spider\" + 0.004*\"night\" + 0.004*\"vision\" + 0.004*\"black\"\n", + "2019-01-31 00:31:15,838 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.028*\"final\" + 0.024*\"tourist\" + 0.022*\"wife\" + 0.020*\"champion\" + 0.018*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 
0.013*\"winner\"\n", + "2019-01-31 00:31:15,844 : INFO : topic diff=0.008169, rho=0.047088\n", + "2019-01-31 00:31:16,001 : INFO : PROGRESS: pass 0, at document #904000/4922894\n", + "2019-01-31 00:31:17,409 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:17,675 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:31:17,677 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:31:17,678 : INFO : topic #37 (0.020): 0.011*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.004*\"night\" + 0.004*\"spider\" + 0.004*\"vision\" + 0.004*\"black\"\n", + "2019-01-31 00:31:17,679 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.011*\"worldwid\" + 0.011*\"collect\"\n", + "2019-01-31 00:31:17,680 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.028*\"germani\" + 0.014*\"vol\" + 0.013*\"austria\" + 0.012*\"berlin\" + 0.012*\"jewish\" + 0.012*\"israel\" + 0.012*\"der\" + 0.010*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:31:17,686 : INFO : topic diff=0.007569, rho=0.047036\n", + "2019-01-31 00:31:17,840 : INFO : PROGRESS: pass 0, at document #906000/4922894\n", + "2019-01-31 00:31:19,228 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:19,494 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"method\" + 
0.005*\"differ\"\n", + "2019-01-31 00:31:19,495 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:31:19,496 : INFO : topic #17 (0.020): 0.070*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.012*\"cathedr\" + 0.010*\"italian\" + 0.010*\"centuri\" + 0.009*\"relationship\"\n", + "2019-01-31 00:31:19,497 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"lizard\" + 0.010*\"juan\" + 0.010*\"francisco\"\n", + "2019-01-31 00:31:19,499 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.016*\"year\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:31:19,504 : INFO : topic diff=0.006656, rho=0.046984\n", + "2019-01-31 00:31:19,661 : INFO : PROGRESS: pass 0, at document #908000/4922894\n", + "2019-01-31 00:31:21,067 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:31:21,333 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.008*\"gothic\"\n", + "2019-01-31 00:31:21,334 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.020*\"member\" + 0.020*\"serv\" + 0.018*\"gener\" + 0.018*\"govern\" + 0.017*\"nation\" + 0.017*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:31:21,335 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.040*\"line\" + 0.038*\"arsen\" + 0.034*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 
0.019*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:31:21,336 : INFO : topic #45 (0.020): 0.019*\"jpg\" + 0.018*\"fifteenth\" + 0.015*\"black\" + 0.015*\"colder\" + 0.014*\"western\" + 0.013*\"illicit\" + 0.012*\"record\" + 0.009*\"blind\" + 0.009*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:31:21,337 : INFO : topic #17 (0.020): 0.071*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.012*\"cathedr\" + 0.010*\"italian\" + 0.010*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:31:21,343 : INFO : topic diff=0.006732, rho=0.046932\n", + "2019-01-31 00:31:21,502 : INFO : PROGRESS: pass 0, at document #910000/4922894\n", + "2019-01-31 00:31:22,922 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:23,189 : INFO : topic #45 (0.020): 0.019*\"jpg\" + 0.018*\"fifteenth\" + 0.015*\"black\" + 0.015*\"colder\" + 0.014*\"western\" + 0.014*\"illicit\" + 0.012*\"record\" + 0.009*\"light\" + 0.009*\"blind\" + 0.007*\"green\"\n", + "2019-01-31 00:31:23,190 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"cotton\" + 0.030*\"unionist\" + 0.028*\"american\" + 0.024*\"new\" + 0.014*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.013*\"year\" + 0.012*\"north\"\n", + "2019-01-31 00:31:23,191 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.015*\"hostil\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:31:23,192 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.017*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"wedg\"\n", + "2019-01-31 00:31:23,193 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" 
+ 0.012*\"cathedr\" + 0.010*\"italian\" + 0.010*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:31:23,199 : INFO : topic diff=0.009476, rho=0.046881\n", + "2019-01-31 00:31:23,354 : INFO : PROGRESS: pass 0, at document #912000/4922894\n", + "2019-01-31 00:31:24,758 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:25,024 : INFO : topic #29 (0.020): 0.014*\"companhia\" + 0.010*\"million\" + 0.009*\"yawn\" + 0.008*\"govern\" + 0.008*\"start\" + 0.008*\"bank\" + 0.007*\"countri\" + 0.007*\"function\" + 0.007*\"market\" + 0.007*\"busi\"\n", + "2019-01-31 00:31:25,025 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.028*\"final\" + 0.023*\"tourist\" + 0.022*\"wife\" + 0.021*\"champion\" + 0.019*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"women\"\n", + "2019-01-31 00:31:25,026 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.073*\"best\" + 0.040*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"festiv\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.019*\"intern\" + 0.019*\"women\" + 0.015*\"prison\"\n", + "2019-01-31 00:31:25,027 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.017*\"feel\" + 0.015*\"hostil\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.011*\"live\" + 0.010*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:31:25,029 : INFO : topic #38 (0.020): 0.021*\"walter\" + 0.010*\"battalion\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"king\" + 0.008*\"centuri\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"till\"\n", + "2019-01-31 00:31:25,035 : INFO : topic diff=0.006759, rho=0.046829\n", + "2019-01-31 00:31:25,192 : INFO : PROGRESS: pass 0, at document #914000/4922894\n", + "2019-01-31 00:31:26,604 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:26,871 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 
0.004*\"vision\" + 0.004*\"bewild\" + 0.004*\"night\" + 0.004*\"spider\" + 0.004*\"black\"\n", + "2019-01-31 00:31:26,872 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.045*\"american\" + 0.028*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.017*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"wedg\"\n", + "2019-01-31 00:31:26,873 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.028*\"offic\" + 0.024*\"minist\" + 0.020*\"member\" + 0.020*\"serv\" + 0.018*\"govern\" + 0.018*\"gener\" + 0.017*\"seri\" + 0.017*\"nation\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:31:26,874 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.017*\"taxpay\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.011*\"théori\"\n", + "2019-01-31 00:31:26,875 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:31:26,881 : INFO : topic diff=0.008904, rho=0.046778\n", + "2019-01-31 00:31:27,040 : INFO : PROGRESS: pass 0, at document #916000/4922894\n", + "2019-01-31 00:31:28,457 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:28,723 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.022*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.013*\"word\"\n", + "2019-01-31 00:31:28,724 : INFO : topic #36 (0.020): 0.011*\"companhia\" + 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.008*\"brio\" + 0.008*\"user\" + 0.007*\"base\" + 0.007*\"includ\"\n", + "2019-01-31 00:31:28,726 : INFO : topic #5 (0.020): 0.041*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 
0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:31:28,727 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.050*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.024*\"korea\" + 0.022*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.013*\"min\"\n", + "2019-01-31 00:31:28,728 : INFO : topic #39 (0.020): 0.041*\"canada\" + 0.034*\"canadian\" + 0.019*\"hoar\" + 0.018*\"toronto\" + 0.016*\"ontario\" + 0.013*\"taxpay\" + 0.013*\"scientist\" + 0.012*\"new\" + 0.012*\"hydrogen\" + 0.011*\"basketbal\"\n", + "2019-01-31 00:31:28,733 : INFO : topic diff=0.007084, rho=0.046727\n", + "2019-01-31 00:31:28,887 : INFO : PROGRESS: pass 0, at document #918000/4922894\n", + "2019-01-31 00:31:30,267 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:30,534 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.004*\"like\" + 0.004*\"man\" + 0.004*\"end\" + 0.004*\"help\"\n", + "2019-01-31 00:31:30,535 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.012*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.010*\"start\" + 0.010*\"sri\"\n", + "2019-01-31 00:31:30,536 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:31:30,537 : INFO : topic #32 (0.020): 0.061*\"district\" + 0.045*\"vigour\" + 0.044*\"tortur\" + 0.043*\"popolo\" + 0.029*\"area\" + 0.025*\"regim\" + 0.025*\"cotton\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:31:30,538 : INFO : topic #29 (0.020): 0.014*\"companhia\" + 0.010*\"million\" + 0.009*\"yawn\" + 0.008*\"govern\" + 0.008*\"start\" + 0.008*\"bank\" + 
0.007*\"countri\" + 0.007*\"function\" + 0.007*\"market\" + 0.007*\"busi\"\n", + "2019-01-31 00:31:30,544 : INFO : topic diff=0.007579, rho=0.046676\n", + "2019-01-31 00:31:33,355 : INFO : -11.682 per-word bound, 3285.1 perplexity estimate based on a held-out corpus of 2000 documents with 607112 words\n", + "2019-01-31 00:31:33,356 : INFO : PROGRESS: pass 0, at document #920000/4922894\n", + "2019-01-31 00:31:34,795 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:35,062 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"cotton\" + 0.029*\"unionist\" + 0.028*\"american\" + 0.024*\"new\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.013*\"year\" + 0.012*\"north\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:31:35,063 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:31:35,065 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.061*\"parti\" + 0.024*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"liber\" + 0.013*\"seaport\"\n", + "2019-01-31 00:31:35,066 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"acid\"\n", + "2019-01-31 00:31:35,067 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:31:35,073 : INFO : topic diff=0.008514, rho=0.046625\n", + "2019-01-31 00:31:35,228 : INFO : PROGRESS: pass 0, at document #922000/4922894\n", + "2019-01-31 00:31:36,630 : 
INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:36,897 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.011*\"cathedr\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"italian\"\n", + "2019-01-31 00:31:36,898 : INFO : topic #5 (0.020): 0.041*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:31:36,899 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:31:36,900 : INFO : topic #26 (0.020): 0.031*\"alic\" + 0.030*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"left\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"rainfal\"\n", + "2019-01-31 00:31:36,901 : INFO : topic #39 (0.020): 0.041*\"canada\" + 0.034*\"canadian\" + 0.019*\"hoar\" + 0.017*\"toronto\" + 0.016*\"ontario\" + 0.013*\"taxpay\" + 0.013*\"scientist\" + 0.012*\"new\" + 0.011*\"hydrogen\" + 0.011*\"basketbal\"\n", + "2019-01-31 00:31:36,907 : INFO : topic diff=0.006184, rho=0.046575\n", + "2019-01-31 00:31:37,062 : INFO : PROGRESS: pass 0, at document #924000/4922894\n", + "2019-01-31 00:31:38,458 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:38,725 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.020*\"candid\" + 0.016*\"taxpay\" + 0.013*\"ret\" + 0.013*\"driver\" + 0.012*\"find\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.011*\"landslid\" + 0.011*\"théori\"\n", + "2019-01-31 00:31:38,726 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"centuri\" + 
0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"trade\"\n", + "2019-01-31 00:31:38,727 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.025*\"player\" + 0.025*\"scientist\" + 0.022*\"taxpay\" + 0.020*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.010*\"folei\" + 0.009*\"ruler\" + 0.009*\"yawn\"\n", + "2019-01-31 00:31:38,728 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:31:38,729 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"new\" + 0.025*\"australia\" + 0.025*\"london\" + 0.022*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:31:38,735 : INFO : topic diff=0.008220, rho=0.046524\n", + "2019-01-31 00:31:38,949 : INFO : PROGRESS: pass 0, at document #926000/4922894\n", + "2019-01-31 00:31:40,358 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:40,623 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.038*\"arsen\" + 0.036*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.013*\"artist\" + 0.013*\"exhaust\"\n", + "2019-01-31 00:31:40,625 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.016*\"parish\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.011*\"cathedr\" + 0.010*\"centuri\" + 0.010*\"historiographi\"\n", + "2019-01-31 00:31:40,626 : INFO : topic #5 (0.020): 0.041*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:31:40,627 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.017*\"folei\" + 
0.016*\"polit\" + 0.016*\"player\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.011*\"wedg\"\n", + "2019-01-31 00:31:40,628 : INFO : topic #8 (0.020): 0.030*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.016*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.010*\"legal\" + 0.008*\"replac\" + 0.008*\"justic\"\n", + "2019-01-31 00:31:40,634 : INFO : topic diff=0.008511, rho=0.046474\n", + "2019-01-31 00:31:40,786 : INFO : PROGRESS: pass 0, at document #928000/4922894\n", + "2019-01-31 00:31:42,152 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:42,418 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:31:42,419 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.027*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:31:42,420 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.016*\"strategist\" + 0.015*\"year\" + 0.014*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.008*\"highli\"\n", + "2019-01-31 00:31:42,421 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:31:42,422 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.012*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"francisco\" + 0.011*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 00:31:42,428 : INFO : topic diff=0.007606, rho=0.046424\n", + "2019-01-31 00:31:42,585 : INFO : PROGRESS: pass 0, at document #930000/4922894\n", + "2019-01-31 
00:31:44,009 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:44,275 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.010*\"companhia\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"user\" + 0.008*\"brio\" + 0.008*\"softwar\" + 0.008*\"base\"\n", + "2019-01-31 00:31:44,277 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"man\"\n", + "2019-01-31 00:31:44,278 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:31:44,279 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.038*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.013*\"artist\" + 0.013*\"exhaust\"\n", + "2019-01-31 00:31:44,280 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"governor\" + 0.012*\"word\" + 0.012*\"http\"\n", + "2019-01-31 00:31:44,286 : INFO : topic diff=0.008304, rho=0.046374\n", + "2019-01-31 00:31:44,441 : INFO : PROGRESS: pass 0, at document #932000/4922894\n", + "2019-01-31 00:31:45,855 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:46,122 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:31:46,123 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.028*\"offic\" + 0.024*\"minist\" + 0.020*\"member\" + 0.020*\"serv\" + 0.018*\"govern\" 
+ 0.018*\"gener\" + 0.017*\"seri\" + 0.017*\"nation\" + 0.015*\"chickasaw\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:31:46,124 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.024*\"korean\" + 0.024*\"korea\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.013*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:31:46,125 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.004*\"bewild\" + 0.004*\"vision\" + 0.004*\"night\" + 0.003*\"black\" + 0.003*\"admit\"\n", + "2019-01-31 00:31:46,126 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.021*\"cathol\" + 0.020*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.015*\"parish\" + 0.015*\"retroflex\" + 0.011*\"cathedr\" + 0.010*\"historiographi\" + 0.010*\"centuri\"\n", + "2019-01-31 00:31:46,132 : INFO : topic diff=0.006844, rho=0.046324\n", + "2019-01-31 00:31:46,286 : INFO : PROGRESS: pass 0, at document #934000/4922894\n", + "2019-01-31 00:31:47,688 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:47,955 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"origin\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.008*\"centuri\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"trade\"\n", + "2019-01-31 00:31:47,956 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.015*\"year\" + 0.015*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.008*\"dai\"\n", + "2019-01-31 00:31:47,957 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:31:47,958 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"battalion\" + 0.009*\"king\" + 
0.008*\"forc\" + 0.008*\"aza\" + 0.008*\"empath\" + 0.008*\"centuri\" + 0.007*\"armi\" + 0.006*\"citi\" + 0.006*\"pour\"\n", + "2019-01-31 00:31:47,959 : INFO : topic #45 (0.020): 0.020*\"jpg\" + 0.019*\"fifteenth\" + 0.015*\"black\" + 0.014*\"western\" + 0.014*\"colder\" + 0.014*\"illicit\" + 0.012*\"record\" + 0.009*\"light\" + 0.009*\"blind\" + 0.007*\"green\"\n", + "2019-01-31 00:31:47,965 : INFO : topic diff=0.007177, rho=0.046274\n", + "2019-01-31 00:31:48,125 : INFO : PROGRESS: pass 0, at document #936000/4922894\n", + "2019-01-31 00:31:49,558 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:49,825 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.009*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:31:49,826 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.025*\"schuster\" + 0.021*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.016*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:31:49,827 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.016*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.010*\"wedg\"\n", + "2019-01-31 00:31:49,829 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:31:49,830 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:31:49,836 : INFO : topic diff=0.010119, rho=0.046225\n", + "2019-01-31 00:31:49,990 : INFO : PROGRESS: pass 0, at 
document #938000/4922894\n", + "2019-01-31 00:31:51,355 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:51,621 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:31:51,622 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.008*\"class\"\n", + "2019-01-31 00:31:51,623 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.077*\"octob\" + 0.074*\"march\" + 0.067*\"januari\" + 0.066*\"august\" + 0.066*\"juli\" + 0.066*\"notion\" + 0.064*\"april\" + 0.063*\"decatur\" + 0.063*\"judici\"\n", + "2019-01-31 00:31:51,624 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"method\" + 0.006*\"differ\"\n", + "2019-01-31 00:31:51,625 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.025*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:31:51,631 : INFO : topic diff=0.007750, rho=0.046176\n", + "2019-01-31 00:31:54,332 : INFO : -11.930 per-word bound, 3900.8 perplexity estimate based on a held-out corpus of 2000 documents with 557660 words\n", + "2019-01-31 00:31:54,332 : INFO : PROGRESS: pass 0, at document #940000/4922894\n", + "2019-01-31 00:31:55,732 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:55,998 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"live\" + 
0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:31:55,999 : INFO : topic #16 (0.020): 0.046*\"king\" + 0.032*\"priest\" + 0.020*\"quarterli\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.016*\"rotterdam\" + 0.015*\"idiosyncrat\" + 0.014*\"portugues\" + 0.014*\"count\" + 0.013*\"maria\"\n", + "2019-01-31 00:31:56,000 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.049*\"chilton\" + 0.027*\"kong\" + 0.026*\"hong\" + 0.024*\"korea\" + 0.023*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.013*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:31:56,001 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"cotton\" + 0.030*\"unionist\" + 0.028*\"american\" + 0.024*\"new\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"year\"\n", + "2019-01-31 00:31:56,002 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.037*\"arsen\" + 0.035*\"raid\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.015*\"pain\" + 0.013*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:31:56,008 : INFO : topic diff=0.008186, rho=0.046127\n", + "2019-01-31 00:31:56,166 : INFO : PROGRESS: pass 0, at document #942000/4922894\n", + "2019-01-31 00:31:57,559 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:57,825 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.036*\"perceptu\" + 0.022*\"theater\" + 0.020*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"word\" + 0.012*\"physician\"\n", + "2019-01-31 00:31:57,826 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.014*\"islam\" + 0.014*\"televis\" + 0.012*\"khalsa\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.010*\"sri\" + 0.010*\"start\"\n", + "2019-01-31 00:31:57,827 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.017*\"taxpay\" + 0.013*\"martin\" + 0.013*\"tiepolo\" + 
0.013*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 00:31:57,828 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.020*\"candid\" + 0.016*\"taxpay\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"landslid\" + 0.011*\"théori\"\n", + "2019-01-31 00:31:57,829 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.022*\"mexico\" + 0.020*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"mexican\" + 0.010*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 00:31:57,835 : INFO : topic diff=0.007473, rho=0.046078\n", + "2019-01-31 00:31:57,988 : INFO : PROGRESS: pass 0, at document #944000/4922894\n", + "2019-01-31 00:31:59,375 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:31:59,641 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"alic\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"left\"\n", + "2019-01-31 00:31:59,642 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:31:59,643 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.013*\"martin\" + 0.013*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:31:59,644 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\" + 0.010*\"mexican\"\n", + "2019-01-31 00:31:59,645 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.019*\"sweden\" + 0.018*\"swedish\" + 0.016*\"norwai\" + 0.015*\"wind\" + 
0.014*\"huntsvil\" + 0.013*\"norwegian\" + 0.013*\"treeless\" + 0.012*\"damag\" + 0.012*\"farid\"\n", + "2019-01-31 00:31:59,651 : INFO : topic diff=0.008291, rho=0.046029\n", + "2019-01-31 00:31:59,805 : INFO : PROGRESS: pass 0, at document #946000/4922894\n", + "2019-01-31 00:32:01,200 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:01,466 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"slur\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:32:01,467 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.020*\"dutch\" + 0.017*\"folei\" + 0.017*\"player\" + 0.016*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:32:01,468 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.014*\"parish\" + 0.011*\"cathedr\" + 0.009*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:32:01,469 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:32:01,471 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.004*\"night\" + 0.004*\"bewild\" + 0.004*\"vision\" + 0.003*\"black\" + 0.003*\"comic\"\n", + "2019-01-31 00:32:01,477 : INFO : topic diff=0.006835, rho=0.045980\n", + "2019-01-31 00:32:01,639 : INFO : PROGRESS: pass 0, at document #948000/4922894\n", + "2019-01-31 00:32:03,064 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:03,331 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 
0.026*\"alic\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.017*\"left\"\n", + "2019-01-31 00:32:03,332 : INFO : topic #29 (0.020): 0.015*\"companhia\" + 0.011*\"million\" + 0.009*\"yawn\" + 0.009*\"bank\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"busi\" + 0.007*\"function\" + 0.007*\"countri\" + 0.007*\"market\"\n", + "2019-01-31 00:32:03,333 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.019*\"warmth\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:32:03,334 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"acid\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:32:03,335 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.048*\"chilton\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.023*\"korea\" + 0.021*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:32:03,341 : INFO : topic diff=0.010003, rho=0.045932\n", + "2019-01-31 00:32:03,497 : INFO : PROGRESS: pass 0, at document #950000/4922894\n", + "2019-01-31 00:32:04,887 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:05,154 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:32:05,155 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:32:05,156 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.037*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 
0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:32:05,157 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.022*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"mexican\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 00:32:05,158 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.013*\"jewish\" + 0.012*\"der\" + 0.012*\"israel\" + 0.009*\"austria\" + 0.009*\"european\" + 0.009*\"itali\"\n", + "2019-01-31 00:32:05,164 : INFO : topic diff=0.008111, rho=0.045883\n", + "2019-01-31 00:32:05,318 : INFO : PROGRESS: pass 0, at document #952000/4922894\n", + "2019-01-31 00:32:06,707 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:06,973 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.015*\"year\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.008*\"dai\"\n", + "2019-01-31 00:32:06,974 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"candid\"\n", + "2019-01-31 00:32:06,976 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"end\" + 0.004*\"man\"\n", + "2019-01-31 00:32:06,977 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.056*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"report\" + 0.014*\"selma\"\n", + "2019-01-31 00:32:06,978 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.014*\"hostil\" + 
0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:32:06,984 : INFO : topic diff=0.007736, rho=0.045835\n", + "2019-01-31 00:32:07,136 : INFO : PROGRESS: pass 0, at document #954000/4922894\n", + "2019-01-31 00:32:08,507 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:08,774 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:32:08,775 : INFO : topic #31 (0.020): 0.059*\"fusiform\" + 0.024*\"scientist\" + 0.024*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yard\" + 0.010*\"yawn\"\n", + "2019-01-31 00:32:08,776 : INFO : topic #29 (0.020): 0.015*\"companhia\" + 0.011*\"million\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"busi\" + 0.007*\"function\" + 0.007*\"countri\" + 0.007*\"market\"\n", + "2019-01-31 00:32:08,777 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.032*\"cotton\" + 0.030*\"unionist\" + 0.029*\"american\" + 0.024*\"new\" + 0.014*\"terri\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.013*\"year\" + 0.012*\"north\"\n", + "2019-01-31 00:32:08,778 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.024*\"mexico\" + 0.022*\"spain\" + 0.020*\"del\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"mexican\" + 0.011*\"juan\" + 0.010*\"josé\" + 0.010*\"carlo\"\n", + "2019-01-31 00:32:08,784 : INFO : topic diff=0.008295, rho=0.045787\n", + "2019-01-31 00:32:08,945 : INFO : PROGRESS: pass 0, at document #956000/4922894\n", + "2019-01-31 00:32:10,373 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:10,639 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 
0.014*\"unionist\" + 0.013*\"airmen\" + 0.013*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 00:32:10,640 : INFO : topic #23 (0.020): 0.132*\"audit\" + 0.072*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.022*\"intern\" + 0.021*\"festiv\" + 0.018*\"women\" + 0.016*\"winner\"\n", + "2019-01-31 00:32:10,641 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.004*\"vision\" + 0.004*\"night\" + 0.004*\"bewild\" + 0.003*\"black\" + 0.003*\"comic\"\n", + "2019-01-31 00:32:10,643 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\" + 0.010*\"rosenwald\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:32:10,644 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.019*\"candid\" + 0.016*\"taxpay\" + 0.014*\"horac\" + 0.012*\"driver\" + 0.012*\"landslid\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:32:10,650 : INFO : topic diff=0.007442, rho=0.045739\n", + "2019-01-31 00:32:10,860 : INFO : PROGRESS: pass 0, at document #958000/4922894\n", + "2019-01-31 00:32:12,272 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:12,538 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:32:12,539 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:32:12,540 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.056*\"parti\" + 
0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"report\" + 0.014*\"bypass\"\n", + "2019-01-31 00:32:12,541 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.076*\"octob\" + 0.072*\"march\" + 0.068*\"august\" + 0.068*\"januari\" + 0.065*\"notion\" + 0.065*\"juli\" + 0.064*\"decatur\" + 0.063*\"april\" + 0.062*\"judici\"\n", + "2019-01-31 00:32:12,542 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.022*\"theater\" + 0.020*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:32:12,548 : INFO : topic diff=0.007158, rho=0.045691\n", + "2019-01-31 00:32:15,231 : INFO : -11.914 per-word bound, 3858.4 perplexity estimate based on a held-out corpus of 2000 documents with 536438 words\n", + "2019-01-31 00:32:15,232 : INFO : PROGRESS: pass 0, at document #960000/4922894\n", + "2019-01-31 00:32:16,621 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:16,887 : INFO : topic #13 (0.020): 0.025*\"new\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.025*\"australia\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:32:16,888 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.019*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.014*\"wind\" + 0.013*\"treeless\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"damag\" + 0.011*\"denmark\"\n", + "2019-01-31 00:32:16,889 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.076*\"octob\" + 0.072*\"march\" + 0.069*\"januari\" + 0.068*\"august\" + 0.066*\"notion\" + 0.066*\"juli\" + 0.064*\"decatur\" + 0.063*\"april\" + 0.062*\"judici\"\n", + "2019-01-31 00:32:16,890 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.031*\"cotton\" + 0.031*\"unionist\" + 0.028*\"american\" + 0.024*\"new\" + 0.014*\"california\" + 
0.014*\"terri\" + 0.013*\"warrior\" + 0.013*\"year\" + 0.012*\"north\"\n", + "2019-01-31 00:32:16,891 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"man\"\n", + "2019-01-31 00:32:16,898 : INFO : topic diff=0.007073, rho=0.045644\n", + "2019-01-31 00:32:17,055 : INFO : PROGRESS: pass 0, at document #962000/4922894\n", + "2019-01-31 00:32:18,946 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:19,212 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.073*\"best\" + 0.036*\"yawn\" + 0.027*\"jacksonvil\" + 0.023*\"noll\" + 0.023*\"japanes\" + 0.022*\"intern\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.015*\"winner\"\n", + "2019-01-31 00:32:19,213 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:32:19,214 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:32:19,215 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.013*\"airmen\" + 0.011*\"refut\"\n", + "2019-01-31 00:32:19,217 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.019*\"candid\" + 0.017*\"taxpay\" + 0.014*\"horac\" + 0.013*\"driver\" + 0.012*\"landslid\" + 0.011*\"find\" + 0.011*\"fool\" + 0.011*\"tornado\" + 0.011*\"ret\"\n", + "2019-01-31 00:32:19,223 : INFO : topic diff=0.008002, rho=0.045596\n", + "2019-01-31 00:32:19,380 : INFO : PROGRESS: pass 0, at document #964000/4922894\n", + "2019-01-31 00:32:20,819 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:21,086 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 00:32:21,087 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:32:21,088 : INFO : topic #25 (0.020): 0.029*\"ring\" + 0.018*\"lagrang\" + 0.018*\"warmth\" + 0.017*\"area\" + 0.014*\"mount\" + 0.010*\"palmer\" + 0.009*\"foam\" + 0.009*\"north\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:32:21,089 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.009*\"companhia\" + 0.009*\"develop\" + 0.009*\"serv\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"base\" + 0.008*\"includ\"\n", + "2019-01-31 00:32:21,090 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.017*\"taxpay\" + 0.014*\"horac\" + 0.013*\"driver\" + 0.012*\"landslid\" + 0.011*\"tornado\" + 0.011*\"find\" + 0.011*\"fool\" + 0.011*\"ret\"\n", + "2019-01-31 00:32:21,096 : INFO : topic diff=0.008078, rho=0.045549\n", + "2019-01-31 00:32:21,253 : INFO : PROGRESS: pass 0, at document #966000/4922894\n", + "2019-01-31 00:32:22,664 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:22,930 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.012*\"rival\" + 0.010*\"georg\" + 0.010*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:32:22,931 : INFO : topic #13 (0.020): 0.025*\"london\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.025*\"australia\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" 
+ 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:32:22,932 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.046*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.025*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.018*\"commun\"\n", + "2019-01-31 00:32:22,933 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.028*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.015*\"leah\" + 0.014*\"sourc\" + 0.013*\"kim\" + 0.013*\"taiwan\"\n", + "2019-01-31 00:32:22,934 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"task\" + 0.008*\"class\"\n", + "2019-01-31 00:32:22,940 : INFO : topic diff=0.008432, rho=0.045502\n", + "2019-01-31 00:32:23,094 : INFO : PROGRESS: pass 0, at document #968000/4922894\n", + "2019-01-31 00:32:24,520 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:24,786 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"mexico\" + 0.022*\"spain\" + 0.020*\"del\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"mexican\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 00:32:24,788 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:32:24,789 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.012*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"candid\"\n", + "2019-01-31 00:32:24,790 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.076*\"octob\" + 0.072*\"march\" + 0.069*\"januari\" + 0.068*\"august\" + 0.067*\"notion\" + 0.066*\"juli\" + 
0.064*\"decatur\" + 0.063*\"april\" + 0.063*\"judici\"\n", + "2019-01-31 00:32:24,791 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.029*\"workplac\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"alic\" + 0.023*\"men\" + 0.023*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.017*\"nation\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:32:24,797 : INFO : topic diff=0.007734, rho=0.045455\n", + "2019-01-31 00:32:24,952 : INFO : PROGRESS: pass 0, at document #970000/4922894\n", + "2019-01-31 00:32:26,355 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:26,621 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airmen\" + 0.012*\"refut\"\n", + "2019-01-31 00:32:26,623 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"man\" + 0.004*\"help\"\n", + "2019-01-31 00:32:26,624 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.019*\"candid\" + 0.017*\"taxpay\" + 0.015*\"ret\" + 0.013*\"horac\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.011*\"find\"\n", + "2019-01-31 00:32:26,625 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.040*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"class\" + 0.010*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 00:32:26,626 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"companhia\" + 0.009*\"serv\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"includ\" + 0.008*\"base\"\n", + "2019-01-31 00:32:26,632 : INFO : topic diff=0.006966, rho=0.045408\n", + "2019-01-31 00:32:26,790 : INFO : PROGRESS: pass 0, at document 
#972000/4922894\n", + "2019-01-31 00:32:28,193 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:28,459 : INFO : topic #45 (0.020): 0.021*\"fifteenth\" + 0.020*\"jpg\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"illicit\" + 0.013*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:32:28,460 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.017*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airmen\" + 0.011*\"airbu\"\n", + "2019-01-31 00:32:28,461 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"man\" + 0.004*\"end\" + 0.004*\"help\"\n", + "2019-01-31 00:32:28,462 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:32:28,463 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"wine\" + 0.011*\"piec\"\n", + "2019-01-31 00:32:28,469 : INFO : topic diff=0.007905, rho=0.045361\n", + "2019-01-31 00:32:28,628 : INFO : PROGRESS: pass 0, at document #974000/4922894\n", + "2019-01-31 00:32:30,049 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:30,316 : INFO : topic #29 (0.020): 0.016*\"companhia\" + 0.011*\"million\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"busi\" + 0.007*\"market\" + 0.007*\"countri\" + 0.007*\"function\"\n", + "2019-01-31 00:32:30,317 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.039*\"sovereignti\" + 0.032*\"rural\" + 0.027*\"poison\" + 0.024*\"reprint\" 
+ 0.024*\"personifi\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 00:32:30,318 : INFO : topic #15 (0.020): 0.013*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.009*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:32:30,319 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:32:30,320 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.034*\"cotton\" + 0.030*\"unionist\" + 0.028*\"american\" + 0.025*\"new\" + 0.013*\"year\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.013*\"california\" + 0.012*\"north\"\n", + "2019-01-31 00:32:30,326 : INFO : topic diff=0.009206, rho=0.045314\n", + "2019-01-31 00:32:30,488 : INFO : PROGRESS: pass 0, at document #976000/4922894\n", + "2019-01-31 00:32:31,903 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:32,169 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.024*\"scientist\" + 0.024*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.009*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:32:32,170 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:32:32,172 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"man\" + 0.004*\"help\"\n", + "2019-01-31 00:32:32,173 : INFO : topic #41 (0.020): 0.047*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.016*\"year\" + 0.015*\"strategist\" + 
0.014*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.008*\"dai\"\n", + "2019-01-31 00:32:32,174 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.005*\"vision\" + 0.004*\"bewild\" + 0.004*\"comic\" + 0.004*\"night\" + 0.003*\"black\"\n", + "2019-01-31 00:32:32,180 : INFO : topic diff=0.009012, rho=0.045268\n", + "2019-01-31 00:32:32,339 : INFO : PROGRESS: pass 0, at document #978000/4922894\n", + "2019-01-31 00:32:33,767 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:34,033 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:32:34,034 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"turn\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:32:34,035 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:32:34,036 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.038*\"arsen\" + 0.033*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"artist\"\n", + "2019-01-31 00:32:34,037 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.012*\"parish\" + 0.010*\"historiographi\" + 0.010*\"cathedr\" + 0.009*\"centuri\"\n", + "2019-01-31 00:32:34,043 : INFO : topic diff=0.006830, rho=0.045222\n", + "2019-01-31 00:32:36,816 : INFO : -11.568 per-word bound, 3035.8 
perplexity estimate based on a held-out corpus of 2000 documents with 604118 words\n", + "2019-01-31 00:32:36,816 : INFO : PROGRESS: pass 0, at document #980000/4922894\n", + "2019-01-31 00:32:38,235 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:38,501 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:32:38,502 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.010*\"nativist\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 00:32:38,504 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:32:38,504 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.078*\"octob\" + 0.076*\"march\" + 0.069*\"august\" + 0.069*\"juli\" + 0.068*\"april\" + 0.068*\"januari\" + 0.068*\"judici\" + 0.067*\"notion\" + 0.065*\"decatur\"\n", + "2019-01-31 00:32:38,505 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"horac\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.011*\"find\"\n", + "2019-01-31 00:32:38,511 : INFO : topic diff=0.007551, rho=0.045175\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:32:38,667 : INFO : PROGRESS: pass 0, at document #982000/4922894\n", + "2019-01-31 00:32:40,069 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:40,335 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" 
+ 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 00:32:40,336 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.034*\"cotton\" + 0.030*\"unionist\" + 0.028*\"american\" + 0.025*\"new\" + 0.014*\"year\" + 0.013*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:32:40,337 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.015*\"tiepolo\" + 0.014*\"open\" + 0.014*\"chamber\" + 0.014*\"women\"\n", + "2019-01-31 00:32:40,339 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.022*\"festiv\" + 0.022*\"intern\" + 0.018*\"women\" + 0.015*\"winner\"\n", + "2019-01-31 00:32:40,340 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.034*\"priest\" + 0.022*\"quarterli\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.016*\"grammat\" + 0.016*\"rotterdam\" + 0.014*\"maria\" + 0.014*\"count\" + 0.014*\"portugues\"\n", + "2019-01-31 00:32:40,345 : INFO : topic diff=0.007005, rho=0.045129\n", + "2019-01-31 00:32:40,500 : INFO : PROGRESS: pass 0, at document #984000/4922894\n", + "2019-01-31 00:32:41,895 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:42,162 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"ruler\" + 0.010*\"yawn\"\n", + "2019-01-31 00:32:42,163 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.036*\"arsen\" + 0.033*\"raid\" + 0.028*\"museo\" + 0.022*\"traceabl\" + 0.019*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:32:42,164 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"proper\" + 
0.007*\"hormon\" + 0.006*\"caus\" + 0.006*\"acid\" + 0.006*\"treat\"\n", + "2019-01-31 00:32:42,165 : INFO : topic #29 (0.020): 0.016*\"companhia\" + 0.011*\"million\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"busi\" + 0.007*\"function\" + 0.007*\"market\" + 0.007*\"countri\"\n", + "2019-01-31 00:32:42,166 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.034*\"cotton\" + 0.030*\"unionist\" + 0.028*\"american\" + 0.025*\"new\" + 0.014*\"year\" + 0.013*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:32:42,172 : INFO : topic diff=0.007549, rho=0.045083\n", + "2019-01-31 00:32:42,329 : INFO : PROGRESS: pass 0, at document #986000/4922894\n", + "2019-01-31 00:32:43,743 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:44,009 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"utopian\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"poet\"\n", + "2019-01-31 00:32:44,010 : INFO : topic #15 (0.020): 0.013*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"cultur\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:32:44,011 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"hormon\" + 0.006*\"caus\" + 0.006*\"acid\" + 0.006*\"treat\"\n", + "2019-01-31 00:32:44,013 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.021*\"serv\" + 0.019*\"member\" + 0.018*\"gener\" + 0.018*\"govern\" + 0.017*\"nation\" + 0.017*\"seri\" + 0.014*\"chickasaw\"\n", + "2019-01-31 00:32:44,014 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.033*\"raid\" + 0.028*\"museo\" + 0.022*\"traceabl\" + 0.019*\"serv\" + 
0.015*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:32:44,019 : INFO : topic diff=0.008941, rho=0.045038\n", + "2019-01-31 00:32:44,175 : INFO : PROGRESS: pass 0, at document #988000/4922894\n", + "2019-01-31 00:32:45,573 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:45,839 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.038*\"struggl\" + 0.036*\"high\" + 0.028*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"gothic\" + 0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:32:45,840 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:32:45,841 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.011*\"genu\" + 0.011*\"plaisir\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:32:45,842 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"mexico\" + 0.021*\"spain\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"mexican\" + 0.011*\"francisco\"\n", + "2019-01-31 00:32:45,843 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.017*\"sweden\" + 0.017*\"norwegian\" + 0.017*\"stop\" + 0.016*\"swedish\" + 0.013*\"wind\" + 0.011*\"treeless\" + 0.011*\"damag\" + 0.011*\"turkish\" + 0.011*\"replac\"\n", + "2019-01-31 00:32:45,849 : INFO : topic diff=0.007313, rho=0.044992\n", + "2019-01-31 00:32:46,008 : INFO : PROGRESS: pass 0, at document #990000/4922894\n", + "2019-01-31 00:32:47,421 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:47,687 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.019*\"requir\" + 
0.018*\"student\" + 0.015*\"professor\" + 0.012*\"governor\" + 0.012*\"word\" + 0.012*\"http\"\n", + "2019-01-31 00:32:47,688 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.030*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.019*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.014*\"women\"\n", + "2019-01-31 00:32:47,690 : INFO : topic #29 (0.020): 0.016*\"companhia\" + 0.011*\"million\" + 0.009*\"yawn\" + 0.008*\"bank\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"busi\" + 0.007*\"function\" + 0.007*\"market\" + 0.007*\"industri\"\n", + "2019-01-31 00:32:47,691 : INFO : topic #39 (0.020): 0.044*\"canada\" + 0.035*\"canadian\" + 0.019*\"toronto\" + 0.018*\"hoar\" + 0.017*\"ontario\" + 0.013*\"new\" + 0.013*\"taxpay\" + 0.012*\"scientist\" + 0.011*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:32:47,692 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"mandir\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:32:47,697 : INFO : topic diff=0.009152, rho=0.044947\n", + "2019-01-31 00:32:47,910 : INFO : PROGRESS: pass 0, at document #992000/4922894\n", + "2019-01-31 00:32:49,287 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:49,553 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.038*\"high\" + 0.038*\"struggl\" + 0.028*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"gothic\" + 0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:32:49,554 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.034*\"priest\" + 0.021*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.018*\"duke\" + 0.017*\"grammat\" + 0.016*\"rotterdam\" + 0.014*\"maria\" + 0.014*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:32:49,555 : INFO : topic #33 (0.020): 0.065*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 
0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:32:49,556 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"class\" + 0.010*\"nativist\" + 0.009*\"fleet\"\n", + "2019-01-31 00:32:49,557 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.031*\"germani\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.012*\"israel\" + 0.012*\"jewish\" + 0.012*\"der\" + 0.009*\"austria\" + 0.009*\"european\" + 0.009*\"europ\"\n", + "2019-01-31 00:32:49,563 : INFO : topic diff=0.007153, rho=0.044901\n", + "2019-01-31 00:32:49,718 : INFO : PROGRESS: pass 0, at document #994000/4922894\n", + "2019-01-31 00:32:51,099 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:32:51,366 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.013*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:32:51,367 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"develop\" + 0.008*\"companhia\" + 0.008*\"serv\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"base\"\n", + "2019-01-31 00:32:51,369 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.016*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"airmen\"\n", + "2019-01-31 00:32:51,370 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.035*\"cotton\" + 0.031*\"unionist\" + 0.028*\"american\" + 0.025*\"new\" + 0.014*\"year\" + 0.014*\"warrior\" + 0.013*\"california\" + 0.013*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:32:51,371 : INFO : topic #38 (0.020): 0.023*\"walter\" + 
0.010*\"aza\" + 0.010*\"battalion\" + 0.008*\"forc\" + 0.008*\"king\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"centuri\" + 0.006*\"till\"\n", + "2019-01-31 00:32:51,377 : INFO : topic diff=0.006745, rho=0.044856\n", + "2019-01-31 00:32:51,533 : INFO : PROGRESS: pass 0, at document #996000/4922894\n", + "2019-01-31 00:32:52,944 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:53,210 : INFO : topic #35 (0.020): 0.051*\"russia\" + 0.039*\"sovereignti\" + 0.031*\"rural\" + 0.028*\"poison\" + 0.027*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.019*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 00:32:53,212 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.025*\"australia\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:32:53,213 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.022*\"ret\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"horac\" + 0.011*\"tornado\" + 0.011*\"landslid\" + 0.011*\"fool\" + 0.011*\"find\"\n", + "2019-01-31 00:32:53,214 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"produc\" + 0.008*\"veget\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"mandir\"\n", + "2019-01-31 00:32:53,215 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.028*\"area\" + 0.028*\"cotton\" + 0.025*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.018*\"commun\"\n", + "2019-01-31 00:32:53,221 : INFO : topic diff=0.007562, rho=0.044811\n", + "2019-01-31 00:32:53,371 : INFO : PROGRESS: pass 0, at document #998000/4922894\n", + "2019-01-31 00:32:54,728 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:54,994 : INFO : topic 
#23 (0.020): 0.132*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"festiv\" + 0.022*\"noll\" + 0.021*\"intern\" + 0.018*\"women\" + 0.015*\"winner\"\n", + "2019-01-31 00:32:54,995 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"serv\" + 0.019*\"member\" + 0.018*\"gener\" + 0.018*\"govern\" + 0.018*\"nation\" + 0.017*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:32:54,997 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 00:32:54,998 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.005*\"blue\" + 0.005*\"vision\" + 0.004*\"litig\" + 0.004*\"bewild\" + 0.004*\"night\" + 0.004*\"comic\" + 0.004*\"black\"\n", + "2019-01-31 00:32:54,999 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.057*\"parti\" + 0.025*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.018*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"selma\" + 0.014*\"report\"\n", + "2019-01-31 00:32:55,005 : INFO : topic diff=0.007929, rho=0.044766\n", + "2019-01-31 00:32:57,762 : INFO : -11.721 per-word bound, 3375.1 perplexity estimate based on a held-out corpus of 2000 documents with 592509 words\n", + "2019-01-31 00:32:57,762 : INFO : PROGRESS: pass 0, at document #1000000/4922894\n", + "2019-01-31 00:32:59,172 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:32:59,439 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.021*\"ret\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.013*\"driver\" + 0.011*\"horac\" + 0.011*\"tornado\" + 0.011*\"find\" + 0.010*\"fool\" + 0.010*\"landslid\"\n", + "2019-01-31 00:32:59,440 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"utopian\" + 0.006*\"exampl\" + 
0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"servitud\"\n", + "2019-01-31 00:32:59,441 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.016*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"airmen\" + 0.011*\"militari\"\n", + "2019-01-31 00:32:59,442 : INFO : topic #39 (0.020): 0.046*\"canada\" + 0.034*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.017*\"ontario\" + 0.013*\"new\" + 0.013*\"taxpay\" + 0.012*\"scientist\" + 0.011*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:32:59,443 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.025*\"australia\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.022*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.017*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:32:59,449 : INFO : topic diff=0.008569, rho=0.044721\n", + "2019-01-31 00:32:59,609 : INFO : PROGRESS: pass 0, at document #1002000/4922894\n", + "2019-01-31 00:33:01,032 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:01,298 : INFO : topic #15 (0.020): 0.013*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"cultur\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:33:01,299 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.016*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"airmen\" + 0.012*\"militari\"\n", + "2019-01-31 00:33:01,300 : INFO : topic #35 (0.020): 0.050*\"russia\" + 0.039*\"sovereignti\" + 0.030*\"rural\" + 0.027*\"poison\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 00:33:01,301 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.025*\"minist\" + 0.020*\"serv\" + 
0.019*\"member\" + 0.018*\"govern\" + 0.018*\"gener\" + 0.018*\"nation\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:33:01,303 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.018*\"sweden\" + 0.018*\"stop\" + 0.017*\"norwegian\" + 0.016*\"swedish\" + 0.014*\"wind\" + 0.012*\"replac\" + 0.012*\"treeless\" + 0.012*\"huntsvil\" + 0.011*\"damag\"\n", + "2019-01-31 00:33:01,308 : INFO : topic diff=0.007388, rho=0.044677\n", + "2019-01-31 00:33:01,465 : INFO : PROGRESS: pass 0, at document #1004000/4922894\n", + "2019-01-31 00:33:02,873 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:03,139 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.021*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:33:03,140 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.020*\"ret\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.013*\"driver\" + 0.011*\"fool\" + 0.011*\"horac\" + 0.011*\"tornado\" + 0.011*\"find\" + 0.010*\"landslid\"\n", + "2019-01-31 00:33:03,141 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.025*\"minist\" + 0.020*\"serv\" + 0.019*\"member\" + 0.019*\"govern\" + 0.018*\"gener\" + 0.018*\"nation\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:33:03,142 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.011*\"parish\" + 0.010*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"relationship\"\n", + "2019-01-31 00:33:03,144 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.024*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:33:03,150 : INFO : topic diff=0.007951, rho=0.044632\n", + "2019-01-31 00:33:03,305 : INFO : 
PROGRESS: pass 0, at document #1006000/4922894\n", + "2019-01-31 00:33:04,701 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:33:04,967 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.019*\"korea\" + 0.016*\"korean\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.014*\"sourc\" + 0.013*\"min\"\n", + "2019-01-31 00:33:04,969 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"women\" + 0.014*\"open\"\n", + "2019-01-31 00:33:04,970 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.014*\"pain\" + 0.014*\"exhaust\" + 0.012*\"gai\"\n", + "2019-01-31 00:33:04,971 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:33:04,972 : INFO : topic #39 (0.020): 0.045*\"canada\" + 0.035*\"canadian\" + 0.021*\"toronto\" + 0.018*\"hoar\" + 0.018*\"ontario\" + 0.013*\"taxpay\" + 0.013*\"new\" + 0.013*\"scientist\" + 0.011*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:33:04,978 : INFO : topic diff=0.006917, rho=0.044588\n", + "2019-01-31 00:33:05,134 : INFO : PROGRESS: pass 0, at document #1008000/4922894\n", + "2019-01-31 00:33:06,543 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:06,809 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.016*\"strategist\" + 0.015*\"year\" + 0.013*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:33:06,810 : INFO : 
topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"word\" + 0.012*\"major\"\n", + "2019-01-31 00:33:06,811 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.012*\"leagu\" + 0.012*\"clot\" + 0.011*\"folei\" + 0.010*\"ruler\" + 0.010*\"yawn\"\n", + "2019-01-31 00:33:06,813 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.013*\"mount\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:33:06,814 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:33:06,819 : INFO : topic diff=0.007734, rho=0.044544\n", + "2019-01-31 00:33:06,978 : INFO : PROGRESS: pass 0, at document #1010000/4922894\n", + "2019-01-31 00:33:08,379 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:08,645 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.011*\"pop\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"base\" + 0.008*\"companhia\" + 0.008*\"user\"\n", + "2019-01-31 00:33:08,646 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:33:08,647 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.019*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"women\"\n", + "2019-01-31 00:33:08,648 : INFO : topic #4 (0.020): 
0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"mandir\"\n", + "2019-01-31 00:33:08,650 : INFO : topic #41 (0.020): 0.046*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.016*\"strategist\" + 0.015*\"year\" + 0.013*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:33:08,655 : INFO : topic diff=0.008426, rho=0.044499\n", + "2019-01-31 00:33:08,807 : INFO : PROGRESS: pass 0, at document #1012000/4922894\n", + "2019-01-31 00:33:10,194 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:10,462 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"proper\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"hormon\" + 0.006*\"acid\" + 0.006*\"treat\"\n", + "2019-01-31 00:33:10,463 : INFO : topic #29 (0.020): 0.016*\"companhia\" + 0.010*\"million\" + 0.008*\"yawn\" + 0.008*\"bank\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"market\" + 0.007*\"function\" + 0.007*\"busi\" + 0.007*\"countri\"\n", + "2019-01-31 00:33:10,464 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.012*\"leagu\" + 0.012*\"clot\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.010*\"ruler\"\n", + "2019-01-31 00:33:10,465 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"gothic\" + 0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:33:10,466 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:33:10,473 : INFO : topic diff=0.007525, rho=0.044455\n", 
+ "2019-01-31 00:33:10,630 : INFO : PROGRESS: pass 0, at document #1014000/4922894\n", + "2019-01-31 00:33:12,203 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:12,470 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.008*\"produc\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.007*\"mandir\"\n", + "2019-01-31 00:33:12,471 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.025*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.019*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"airmen\"\n", + "2019-01-31 00:33:12,472 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.008*\"king\" + 0.007*\"till\" + 0.007*\"armi\" + 0.006*\"centuri\"\n", + "2019-01-31 00:33:12,473 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.028*\"offic\" + 0.026*\"minist\" + 0.020*\"serv\" + 0.019*\"govern\" + 0.018*\"member\" + 0.018*\"gener\" + 0.018*\"nation\" + 0.016*\"chickasaw\" + 0.016*\"seri\"\n", + "2019-01-31 00:33:12,474 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:33:12,480 : INFO : topic diff=0.006863, rho=0.044412\n", + "2019-01-31 00:33:12,634 : INFO : PROGRESS: pass 0, at document #1016000/4922894\n", + "2019-01-31 00:33:14,036 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:14,302 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.011*\"parish\" + 0.010*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"relationship\"\n", + "2019-01-31 00:33:14,304 : INFO : topic 
#16 (0.020): 0.045*\"king\" + 0.034*\"priest\" + 0.020*\"quarterli\" + 0.020*\"idiosyncrat\" + 0.018*\"duke\" + 0.017*\"rotterdam\" + 0.016*\"grammat\" + 0.014*\"portugues\" + 0.014*\"princ\" + 0.014*\"maria\"\n", + "2019-01-31 00:33:14,305 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:33:14,306 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.021*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:33:14,307 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.012*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"reconstruct\" + 0.010*\"yawn\"\n", + "2019-01-31 00:33:14,313 : INFO : topic diff=0.006995, rho=0.044368\n", + "2019-01-31 00:33:14,464 : INFO : PROGRESS: pass 0, at document #1018000/4922894\n", + "2019-01-31 00:33:15,827 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:16,094 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.021*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.014*\"case\" + 0.012*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.008*\"judaism\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:33:16,095 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 00:33:16,096 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 
0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:33:16,097 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"cultur\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:33:16,098 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:33:16,105 : INFO : topic diff=0.007742, rho=0.044324\n", + "2019-01-31 00:33:18,785 : INFO : -11.480 per-word bound, 2857.0 perplexity estimate based on a held-out corpus of 2000 documents with 550974 words\n", + "2019-01-31 00:33:18,786 : INFO : PROGRESS: pass 0, at document #1020000/4922894\n", + "2019-01-31 00:33:20,183 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:20,449 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.010*\"georg\" + 0.010*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:33:20,450 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.018*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"women\"\n", + "2019-01-31 00:33:20,451 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.041*\"sovereignti\" + 0.031*\"rural\" + 0.027*\"poison\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:33:20,452 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"base\" + 0.008*\"companhia\" + 0.008*\"cytokin\" + 0.007*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 00:33:20,453 : INFO : topic #4 (0.020): 
0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"produc\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.007*\"fuel\"\n", + "2019-01-31 00:33:20,459 : INFO : topic diff=0.007775, rho=0.044281\n", + "2019-01-31 00:33:20,676 : INFO : PROGRESS: pass 0, at document #1022000/4922894\n", + "2019-01-31 00:33:22,119 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:22,385 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.024*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.019*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:33:22,386 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.022*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:33:22,387 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"josé\"\n", + "2019-01-31 00:33:22,388 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.047*\"chilton\" + 0.028*\"kong\" + 0.026*\"hong\" + 0.019*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.014*\"shirin\" + 0.013*\"sourc\" + 0.013*\"min\"\n", + "2019-01-31 00:33:22,389 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.022*\"australian\" + 0.021*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:33:22,395 : INFO : topic diff=0.007903, rho=0.044237\n", + "2019-01-31 00:33:22,553 : INFO : PROGRESS: pass 0, at document #1024000/4922894\n", + "2019-01-31 00:33:23,987 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:24,253 : INFO : topic #11 
(0.020): 0.028*\"john\" + 0.016*\"will\" + 0.013*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.010*\"mexican–american\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:33:24,254 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.024*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"francisco\"\n", + "2019-01-31 00:33:24,255 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"king\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"till\" + 0.007*\"centuri\"\n", + "2019-01-31 00:33:24,256 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.022*\"australian\" + 0.021*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:33:24,257 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"alic\" + 0.018*\"atheist\" + 0.017*\"nation\"\n", + "2019-01-31 00:33:24,263 : INFO : topic diff=0.006557, rho=0.044194\n", + "2019-01-31 00:33:24,421 : INFO : PROGRESS: pass 0, at document #1026000/4922894\n", + "2019-01-31 00:33:25,835 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:26,101 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"includ\" + 0.008*\"base\" + 0.008*\"softwar\" + 0.008*\"companhia\" + 0.008*\"cytokin\"\n", + "2019-01-31 00:33:26,102 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.007*\"trade\"\n", + "2019-01-31 00:33:26,104 : INFO : topic #2 (0.020): 
0.049*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:33:26,105 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"nicola\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 00:33:26,106 : INFO : topic #21 (0.020): 0.040*\"samford\" + 0.024*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"lizard\" + 0.011*\"francisco\"\n", + "2019-01-31 00:33:26,112 : INFO : topic diff=0.006824, rho=0.044151\n", + "2019-01-31 00:33:26,266 : INFO : PROGRESS: pass 0, at document #1028000/4922894\n", + "2019-01-31 00:33:27,660 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:27,926 : INFO : topic #32 (0.020): 0.058*\"district\" + 0.046*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.029*\"cotton\" + 0.027*\"area\" + 0.026*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:33:27,927 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"proper\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"hormon\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:33:27,928 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"cultur\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"student\"\n", + "2019-01-31 00:33:27,929 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.048*\"chilton\" + 0.027*\"kong\" + 0.026*\"hong\" + 0.019*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.013*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:33:27,930 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 
0.014*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"fuel\"\n", + "2019-01-31 00:33:27,936 : INFO : topic diff=0.006720, rho=0.044108\n", + "2019-01-31 00:33:28,094 : INFO : PROGRESS: pass 0, at document #1030000/4922894\n", + "2019-01-31 00:33:29,511 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:29,777 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.021*\"serv\" + 0.019*\"govern\" + 0.018*\"gener\" + 0.018*\"member\" + 0.018*\"nation\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:33:29,778 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.038*\"sovereignti\" + 0.031*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"malaysia\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:33:29,779 : INFO : topic #45 (0.020): 0.020*\"fifteenth\" + 0.020*\"jpg\" + 0.015*\"colder\" + 0.015*\"illicit\" + 0.015*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.008*\"green\"\n", + "2019-01-31 00:33:29,781 : INFO : topic #37 (0.020): 0.011*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.005*\"vision\" + 0.004*\"litig\" + 0.004*\"bewild\" + 0.004*\"comic\" + 0.004*\"night\" + 0.004*\"black\"\n", + "2019-01-31 00:33:29,782 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"ruler\" + 0.010*\"yawn\"\n", + "2019-01-31 00:33:29,788 : INFO : topic diff=0.008297, rho=0.044065\n", + "2019-01-31 00:33:29,944 : INFO : PROGRESS: pass 0, at document #1032000/4922894\n", + "2019-01-31 00:33:31,364 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:33:31,631 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.007*\"trade\"\n", + "2019-01-31 00:33:31,632 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.042*\"popolo\" + 0.039*\"tortur\" + 0.028*\"cotton\" + 0.028*\"area\" + 0.026*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:33:31,633 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.034*\"cotton\" + 0.031*\"unionist\" + 0.029*\"american\" + 0.025*\"new\" + 0.014*\"warrior\" + 0.014*\"year\" + 0.013*\"california\" + 0.013*\"north\" + 0.013*\"terri\"\n", + "2019-01-31 00:33:31,634 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.023*\"cathol\" + 0.020*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.010*\"parish\" + 0.010*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"relationship\"\n", + "2019-01-31 00:33:31,636 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"king\" + 0.007*\"armi\" + 0.007*\"centuri\" + 0.007*\"till\"\n", + "2019-01-31 00:33:31,641 : INFO : topic diff=0.007242, rho=0.044023\n", + "2019-01-31 00:33:31,795 : INFO : PROGRESS: pass 0, at document #1034000/4922894\n", + "2019-01-31 00:33:33,188 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:33,456 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.022*\"schuster\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:33:33,457 : INFO : topic #16 (0.020): 0.046*\"king\" + 0.032*\"priest\" + 0.019*\"idiosyncrat\" + 0.019*\"quarterli\" + 0.018*\"duke\" + 0.016*\"grammat\" + 0.016*\"rotterdam\" + 0.014*\"portugues\" + 
0.014*\"princ\" + 0.014*\"count\"\n", + "2019-01-31 00:33:33,458 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"arsen\" + 0.039*\"line\" + 0.034*\"raid\" + 0.031*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.014*\"exhaust\" + 0.013*\"gai\"\n", + "2019-01-31 00:33:33,459 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.007*\"king\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"centuri\"\n", + "2019-01-31 00:33:33,460 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.016*\"lagrang\" + 0.013*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"vacant\" + 0.008*\"sourc\"\n", + "2019-01-31 00:33:33,466 : INFO : topic diff=0.006693, rho=0.043980\n", + "2019-01-31 00:33:33,621 : INFO : PROGRESS: pass 0, at document #1036000/4922894\n", + "2019-01-31 00:33:35,041 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:35,307 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"alic\" + 0.018*\"atheist\" + 0.017*\"nation\"\n", + "2019-01-31 00:33:35,308 : INFO : topic #31 (0.020): 0.060*\"fusiform\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.010*\"ruler\"\n", + "2019-01-31 00:33:35,309 : INFO : topic #39 (0.020): 0.042*\"canada\" + 0.035*\"canadian\" + 0.020*\"toronto\" + 0.018*\"hoar\" + 0.017*\"ontario\" + 0.013*\"new\" + 0.012*\"scientist\" + 0.012*\"taxpay\" + 0.012*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:33:35,311 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"king\" + 0.007*\"armi\" + 0.007*\"till\" + 
0.007*\"centuri\"\n", + "2019-01-31 00:33:35,312 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.016*\"strategist\" + 0.014*\"year\" + 0.013*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:33:35,318 : INFO : topic diff=0.006282, rho=0.043937\n", + "2019-01-31 00:33:35,473 : INFO : PROGRESS: pass 0, at document #1038000/4922894\n", + "2019-01-31 00:33:36,879 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:37,146 : INFO : topic #29 (0.020): 0.017*\"companhia\" + 0.010*\"million\" + 0.008*\"bank\" + 0.008*\"yawn\" + 0.008*\"govern\" + 0.008*\"market\" + 0.008*\"start\" + 0.007*\"busi\" + 0.007*\"industri\" + 0.007*\"function\"\n", + "2019-01-31 00:33:37,147 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.016*\"berlin\" + 0.014*\"israel\" + 0.013*\"vol\" + 0.013*\"der\" + 0.012*\"jewish\" + 0.009*\"hungarian\" + 0.009*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 00:33:37,148 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.031*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:33:37,149 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"rival\" + 0.012*\"david\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:33:37,151 : INFO : topic #48 (0.020): 0.076*\"januari\" + 0.076*\"march\" + 0.075*\"octob\" + 0.074*\"sens\" + 0.069*\"notion\" + 0.068*\"april\" + 0.067*\"decatur\" + 0.067*\"juli\" + 0.066*\"august\" + 0.065*\"judici\"\n", + "2019-01-31 00:33:37,156 : INFO : topic diff=0.006991, rho=0.043895\n", + "2019-01-31 00:33:39,941 : INFO : -11.607 per-word bound, 3118.7 perplexity estimate based on a held-out corpus of 2000 documents with 590235 words\n", + 
"2019-01-31 00:33:39,942 : INFO : PROGRESS: pass 0, at document #1040000/4922894\n", + "2019-01-31 00:33:41,381 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:41,647 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"cultur\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"student\"\n", + "2019-01-31 00:33:41,648 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.007*\"trade\"\n", + "2019-01-31 00:33:41,649 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"disco\" + 0.008*\"proper\" + 0.007*\"have\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"acid\" + 0.006*\"hormon\" + 0.006*\"effect\"\n", + "2019-01-31 00:33:41,650 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.023*\"cathol\" + 0.020*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.011*\"parish\" + 0.009*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"poll\"\n", + "2019-01-31 00:33:41,651 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"swedish\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.015*\"wind\" + 0.015*\"treeless\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.013*\"turkish\" + 0.012*\"replac\"\n", + "2019-01-31 00:33:41,657 : INFO : topic diff=0.008986, rho=0.043853\n", + "2019-01-31 00:33:41,813 : INFO : PROGRESS: pass 0, at document #1042000/4922894\n", + "2019-01-31 00:33:43,222 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:43,488 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.041*\"arsen\" + 0.039*\"line\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.013*\"gai\"\n", + "2019-01-31 00:33:43,489 : INFO : topic #30 (0.020): 
0.036*\"leagu\" + 0.036*\"cleveland\" + 0.031*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:33:43,490 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:33:43,492 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:33:43,493 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.028*\"cotton\" + 0.027*\"area\" + 0.025*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:33:43,498 : INFO : topic diff=0.007438, rho=0.043811\n", + "2019-01-31 00:33:43,657 : INFO : PROGRESS: pass 0, at document #1044000/4922894\n", + "2019-01-31 00:33:45,080 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:45,346 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"rival\" + 0.011*\"david\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:33:45,347 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.008*\"replac\" + 0.007*\"judaism\"\n", + "2019-01-31 00:33:45,348 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.023*\"spain\" + 0.020*\"mexico\" + 0.019*\"del\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.011*\"carlo\" + 
0.011*\"francisco\"\n", + "2019-01-31 00:33:45,349 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:33:45,350 : INFO : topic #48 (0.020): 0.075*\"march\" + 0.074*\"januari\" + 0.074*\"octob\" + 0.073*\"sens\" + 0.067*\"notion\" + 0.066*\"april\" + 0.066*\"juli\" + 0.065*\"august\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 00:33:45,356 : INFO : topic diff=0.008850, rho=0.043769\n", + "2019-01-31 00:33:45,511 : INFO : PROGRESS: pass 0, at document #1046000/4922894\n", + "2019-01-31 00:33:46,920 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:47,187 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.016*\"strategist\" + 0.015*\"year\" + 0.013*\"center\" + 0.012*\"open\" + 0.010*\"includ\" + 0.009*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:33:47,188 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.014*\"fool\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"horac\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.010*\"champion\"\n", + "2019-01-31 00:33:47,189 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.050*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.014*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:33:47,190 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.011*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"produc\" + 0.008*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:33:47,191 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.045*\"american\" + 0.031*\"valour\" + 0.021*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 
0.011*\"simpler\"\n", + "2019-01-31 00:33:47,197 : INFO : topic diff=0.006886, rho=0.043727\n", + "2019-01-31 00:33:47,350 : INFO : PROGRESS: pass 0, at document #1048000/4922894\n", + "2019-01-31 00:33:48,741 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:49,007 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.025*\"minist\" + 0.020*\"serv\" + 0.019*\"gener\" + 0.018*\"nation\" + 0.018*\"member\" + 0.018*\"govern\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:33:49,008 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.014*\"vol\" + 0.013*\"der\" + 0.012*\"jewish\" + 0.009*\"european\" + 0.009*\"isra\" + 0.008*\"austria\"\n", + "2019-01-31 00:33:49,010 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.014*\"nicola\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.011*\"magazin\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:33:49,011 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.042*\"arsen\" + 0.038*\"line\" + 0.033*\"raid\" + 0.031*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"gai\"\n", + "2019-01-31 00:33:49,012 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.069*\"best\" + 0.035*\"yawn\" + 0.029*\"jacksonvil\" + 0.026*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.019*\"intern\" + 0.018*\"women\" + 0.015*\"winner\"\n", + "2019-01-31 00:33:49,018 : INFO : topic diff=0.006464, rho=0.043685\n", + "2019-01-31 00:33:49,173 : INFO : PROGRESS: pass 0, at document #1050000/4922894\n", + "2019-01-31 00:33:50,573 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:50,838 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.018*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 
0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:33:50,840 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.039*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 00:33:50,841 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.022*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.017*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:33:50,842 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.004*\"like\" + 0.004*\"deal\" + 0.004*\"end\" + 0.004*\"help\"\n", + "2019-01-31 00:33:50,843 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"airmen\"\n", + "2019-01-31 00:33:50,849 : INFO : topic diff=0.007840, rho=0.043644\n", + "2019-01-31 00:33:51,001 : INFO : PROGRESS: pass 0, at document #1052000/4922894\n", + "2019-01-31 00:33:52,376 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:52,642 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.011*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:33:52,643 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.042*\"arsen\" + 0.037*\"line\" + 0.032*\"raid\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.015*\"pain\" + 0.015*\"exhaust\" + 0.013*\"gai\"\n", + "2019-01-31 00:33:52,644 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.059*\"parti\" + 0.024*\"voluntari\" + 0.021*\"member\" + 0.021*\"democrat\" + 0.018*\"polici\" + 0.014*\"bypass\" + 0.013*\"report\" + 
0.013*\"republ\" + 0.013*\"liber\"\n", + "2019-01-31 00:33:52,645 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.047*\"vigour\" + 0.044*\"popolo\" + 0.039*\"tortur\" + 0.027*\"cotton\" + 0.027*\"area\" + 0.025*\"regim\" + 0.024*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:33:52,646 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.006*\"socialist\"\n", + "2019-01-31 00:33:52,652 : INFO : topic diff=0.007742, rho=0.043602\n", + "2019-01-31 00:33:52,857 : INFO : PROGRESS: pass 0, at document #1054000/4922894\n", + "2019-01-31 00:33:54,248 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:54,515 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.027*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:33:54,516 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.012*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.008*\"till\" + 0.007*\"empath\" + 0.007*\"king\" + 0.007*\"armi\" + 0.007*\"centuri\"\n", + "2019-01-31 00:33:54,517 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.033*\"cotton\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.025*\"new\" + 0.014*\"year\" + 0.014*\"warrior\" + 0.013*\"california\" + 0.013*\"terri\" + 0.013*\"north\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:33:54,518 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"kill\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.004*\"like\" + 0.004*\"end\" + 0.004*\"deal\" + 0.004*\"help\"\n", + "2019-01-31 00:33:54,519 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 
0.012*\"polaris\" + 0.012*\"case\" + 0.008*\"legal\" + 0.008*\"replac\" + 0.007*\"judaism\"\n", + "2019-01-31 00:33:54,525 : INFO : topic diff=0.007114, rho=0.043561\n", + "2019-01-31 00:33:54,679 : INFO : PROGRESS: pass 0, at document #1056000/4922894\n", + "2019-01-31 00:33:56,067 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:56,333 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.021*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.017*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 00:33:56,334 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.022*\"taxpay\" + 0.019*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.010*\"ruler\"\n", + "2019-01-31 00:33:56,335 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.014*\"fool\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"horac\" + 0.010*\"champion\"\n", + "2019-01-31 00:33:56,336 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.024*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.013*\"piec\" + 0.013*\"loui\" + 0.010*\"wine\"\n", + "2019-01-31 00:33:56,337 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.048*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:33:56,343 : INFO : topic diff=0.007609, rho=0.043519\n", + "2019-01-31 00:33:56,497 : INFO : PROGRESS: pass 0, at document #1058000/4922894\n", + "2019-01-31 00:33:57,876 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:33:58,142 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 
0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.008*\"sai\" + 0.008*\"bahá\"\n", + "2019-01-31 00:33:58,143 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.014*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:33:58,144 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:33:58,145 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.010*\"love\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.004*\"vision\" + 0.004*\"comic\" + 0.004*\"madison\" + 0.004*\"night\"\n", + "2019-01-31 00:33:58,146 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.032*\"cotton\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.024*\"new\" + 0.014*\"terri\" + 0.013*\"year\" + 0.013*\"warrior\" + 0.013*\"california\" + 0.013*\"north\"\n", + "2019-01-31 00:33:58,152 : INFO : topic diff=0.006689, rho=0.043478\n", + "2019-01-31 00:34:00,893 : INFO : -11.641 per-word bound, 3194.2 perplexity estimate based on a held-out corpus of 2000 documents with 568585 words\n", + "2019-01-31 00:34:00,893 : INFO : PROGRESS: pass 0, at document #1060000/4922894\n", + "2019-01-31 00:34:02,319 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:02,585 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.036*\"sovereignti\" + 0.031*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.018*\"unfortun\" + 0.016*\"poland\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:34:02,586 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.015*\"year\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 
0.009*\"highli\"\n", + "2019-01-31 00:34:02,587 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"minist\" + 0.026*\"offic\" + 0.020*\"serv\" + 0.019*\"gener\" + 0.019*\"member\" + 0.018*\"nation\" + 0.018*\"govern\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:34:02,588 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"damag\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.013*\"turkish\" + 0.012*\"treeless\" + 0.012*\"replac\"\n", + "2019-01-31 00:34:02,589 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.008*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:34:02,595 : INFO : topic diff=0.007224, rho=0.043437\n", + "2019-01-31 00:34:02,748 : INFO : PROGRESS: pass 0, at document #1062000/4922894\n", + "2019-01-31 00:34:04,130 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:04,396 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.074*\"octob\" + 0.074*\"januari\" + 0.073*\"sens\" + 0.069*\"notion\" + 0.068*\"april\" + 0.066*\"juli\" + 0.066*\"august\" + 0.066*\"decatur\" + 0.063*\"judici\"\n", + "2019-01-31 00:34:04,398 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.017*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:34:04,399 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.032*\"cotton\" + 0.030*\"unionist\" + 0.030*\"american\" + 0.024*\"new\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.013*\"year\" + 0.013*\"north\" + 0.013*\"california\"\n", + "2019-01-31 00:34:04,400 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.026*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 
0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:34:04,401 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.028*\"incumb\" + 0.016*\"televis\" + 0.012*\"islam\" + 0.011*\"pakistan\" + 0.010*\"sri\" + 0.010*\"anglo\" + 0.010*\"affection\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 00:34:04,407 : INFO : topic diff=0.006235, rho=0.043396\n", + "2019-01-31 00:34:04,564 : INFO : PROGRESS: pass 0, at document #1064000/4922894\n", + "2019-01-31 00:34:05,971 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:06,237 : INFO : topic #31 (0.020): 0.059*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"player\" + 0.023*\"taxpay\" + 0.019*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"barber\"\n", + "2019-01-31 00:34:06,238 : INFO : topic #39 (0.020): 0.043*\"canada\" + 0.036*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.013*\"new\" + 0.013*\"nba\" + 0.012*\"scientist\" + 0.011*\"taxpay\" + 0.011*\"hydrogen\"\n", + "2019-01-31 00:34:06,239 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.019*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.012*\"polaris\" + 0.009*\"legal\" + 0.008*\"replac\" + 0.007*\"judaism\"\n", + "2019-01-31 00:34:06,240 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:34:06,241 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:34:06,247 : INFO : topic diff=0.006765, rho=0.043355\n", + "2019-01-31 00:34:06,408 : INFO : PROGRESS: pass 0, at document #1066000/4922894\n", + "2019-01-31 00:34:07,842 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:08,108 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"damag\" + 0.016*\"norwai\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.013*\"treeless\" + 0.013*\"turkish\" + 0.012*\"huntsvil\"\n", + "2019-01-31 00:34:08,109 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:34:08,110 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"serv\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"base\" + 0.008*\"includ\" + 0.007*\"softwar\"\n", + "2019-01-31 00:34:08,111 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.023*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.012*\"ashvil\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:34:08,112 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.075*\"octob\" + 0.073*\"sens\" + 0.073*\"januari\" + 0.068*\"april\" + 0.068*\"notion\" + 0.065*\"decatur\" + 0.065*\"juli\" + 0.065*\"august\" + 0.062*\"judici\"\n", + "2019-01-31 00:34:08,118 : INFO : topic diff=0.007163, rho=0.043315\n", + "2019-01-31 00:34:08,271 : INFO : PROGRESS: pass 0, at document #1068000/4922894\n", + "2019-01-31 00:34:09,669 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:09,935 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.023*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.013*\"report\" + 0.013*\"seaport\" + 0.013*\"liber\"\n", + "2019-01-31 00:34:09,936 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.021*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 
0.015*\"sail\" + 0.014*\"retroflex\" + 0.010*\"parish\" + 0.010*\"relationship\" + 0.009*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:34:09,937 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.023*\"spain\" + 0.020*\"mexico\" + 0.019*\"del\" + 0.013*\"soviet\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.011*\"josé\" + 0.011*\"francisco\"\n", + "2019-01-31 00:34:09,938 : INFO : topic #31 (0.020): 0.059*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"player\" + 0.023*\"taxpay\" + 0.019*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 00:34:09,939 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"dixi\" + 0.004*\"vision\" + 0.004*\"comic\" + 0.004*\"night\"\n", + "2019-01-31 00:34:09,945 : INFO : topic diff=0.006457, rho=0.043274\n", + "2019-01-31 00:34:10,102 : INFO : PROGRESS: pass 0, at document #1070000/4922894\n", + "2019-01-31 00:34:11,502 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:11,768 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.025*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:34:11,769 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.011*\"magazin\" + 0.011*\"collect\"\n", + "2019-01-31 00:34:11,770 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.031*\"cotton\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.024*\"new\" + 0.014*\"warrior\" + 0.014*\"terri\" + 0.013*\"year\" + 0.013*\"california\" + 0.013*\"north\"\n", + "2019-01-31 00:34:11,771 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.016*\"televis\" + 0.012*\"islam\" + 
0.011*\"pakistan\" + 0.011*\"sri\" + 0.010*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"alam\"\n", + "2019-01-31 00:34:11,772 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.027*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:34:11,778 : INFO : topic diff=0.005978, rho=0.043234\n", + "2019-01-31 00:34:11,938 : INFO : PROGRESS: pass 0, at document #1072000/4922894\n", + "2019-01-31 00:34:13,350 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:13,616 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.008*\"bahá\"\n", + "2019-01-31 00:34:13,617 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.032*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:34:13,618 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"mandir\"\n", + "2019-01-31 00:34:13,620 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.030*\"germani\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.013*\"israel\" + 0.013*\"vol\" + 0.012*\"der\" + 0.009*\"jeremiah\" + 0.009*\"european\" + 0.008*\"europ\"\n", + "2019-01-31 00:34:13,621 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"olympo\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 00:34:13,627 : INFO : topic diff=0.007211, rho=0.043193\n", + "2019-01-31 00:34:13,785 : INFO : PROGRESS: pass 0, at document 
#1074000/4922894\n", + "2019-01-31 00:34:15,240 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:15,506 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.005*\"utopian\"\n", + "2019-01-31 00:34:15,507 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"silicon\"\n", + "2019-01-31 00:34:15,509 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.010*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"litig\" + 0.005*\"bewild\" + 0.004*\"vision\" + 0.004*\"comic\" + 0.004*\"dixi\" + 0.004*\"septemb\"\n", + "2019-01-31 00:34:15,510 : INFO : topic #40 (0.020): 0.091*\"unit\" + 0.025*\"collector\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:34:15,511 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.006*\"human\" + 0.006*\"woman\"\n", + "2019-01-31 00:34:15,517 : INFO : topic diff=0.005948, rho=0.043153\n", + "2019-01-31 00:34:15,672 : INFO : PROGRESS: pass 0, at document #1076000/4922894\n", + "2019-01-31 00:34:17,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:17,355 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"septemb\" + 0.024*\"epiru\" + 0.019*\"stake\" + 0.019*\"teacher\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:34:17,356 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 
0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:34:17,357 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.011*\"horac\" + 0.010*\"champion\"\n", + "2019-01-31 00:34:17,358 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.013*\"aza\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.008*\"till\" + 0.008*\"empath\" + 0.007*\"king\" + 0.007*\"armi\" + 0.006*\"centuri\"\n", + "2019-01-31 00:34:17,359 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.006*\"human\" + 0.006*\"student\"\n", + "2019-01-31 00:34:17,366 : INFO : topic diff=0.007542, rho=0.043113\n", + "2019-01-31 00:34:17,525 : INFO : PROGRESS: pass 0, at document #1078000/4922894\n", + "2019-01-31 00:34:18,959 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:19,225 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.005*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 00:34:19,227 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"acid\" + 0.007*\"media\" + 0.007*\"have\" + 0.007*\"proper\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"hormon\"\n", + "2019-01-31 00:34:19,228 : INFO : topic #40 (0.020): 0.091*\"unit\" + 0.025*\"collector\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.019*\"requir\" + 0.017*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:34:19,229 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 
0.010*\"mode\" + 0.008*\"veget\" + 0.008*\"candid\" + 0.008*\"produc\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:34:19,230 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.038*\"tortur\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.025*\"regim\" + 0.025*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:34:19,236 : INFO : topic diff=0.006228, rho=0.043073\n", + "2019-01-31 00:34:21,897 : INFO : -11.672 per-word bound, 3262.0 perplexity estimate based on a held-out corpus of 2000 documents with 526071 words\n", + "2019-01-31 00:34:21,898 : INFO : PROGRESS: pass 0, at document #1080000/4922894\n", + "2019-01-31 00:34:23,286 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:23,553 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"acid\" + 0.007*\"have\" + 0.007*\"proper\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:34:23,554 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.041*\"arsen\" + 0.039*\"line\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"gai\"\n", + "2019-01-31 00:34:23,555 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:34:23,556 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"candid\" + 0.008*\"produc\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:34:23,557 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"fool\" + 0.013*\"driver\" + 
0.012*\"tornado\" + 0.011*\"find\" + 0.011*\"ret\" + 0.011*\"horac\" + 0.010*\"théori\"\n", + "2019-01-31 00:34:23,563 : INFO : topic diff=0.006625, rho=0.043033\n", + "2019-01-31 00:34:23,717 : INFO : PROGRESS: pass 0, at document #1082000/4922894\n", + "2019-01-31 00:34:25,108 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:25,375 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"fool\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.011*\"ret\" + 0.011*\"horac\" + 0.010*\"champion\"\n", + "2019-01-31 00:34:25,376 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:34:25,377 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.006*\"student\" + 0.006*\"woman\"\n", + "2019-01-31 00:34:25,378 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.021*\"christian\" + 0.021*\"cathol\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"centuri\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:34:25,380 : INFO : topic #16 (0.020): 0.045*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.015*\"count\" + 0.013*\"brazil\" + 0.012*\"princ\"\n", + "2019-01-31 00:34:25,385 : INFO : topic diff=0.006195, rho=0.042993\n", + "2019-01-31 00:34:25,540 : INFO : PROGRESS: pass 0, at document #1084000/4922894\n", + "2019-01-31 00:34:26,932 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:27,199 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 
0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"deal\" + 0.004*\"end\" + 0.004*\"help\"\n", + "2019-01-31 00:34:27,200 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:34:27,201 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 00:34:27,202 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.023*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.018*\"polici\" + 0.016*\"liber\" + 0.014*\"republ\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 00:34:27,203 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.036*\"cotton\" + 0.030*\"unionist\" + 0.029*\"american\" + 0.024*\"new\" + 0.014*\"warrior\" + 0.013*\"california\" + 0.013*\"year\" + 0.013*\"terri\" + 0.013*\"north\"\n", + "2019-01-31 00:34:27,209 : INFO : topic diff=0.006214, rho=0.042954\n", + "2019-01-31 00:34:27,364 : INFO : PROGRESS: pass 0, at document #1086000/4922894\n", + "2019-01-31 00:34:28,764 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:29,030 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.039*\"tortur\" + 0.028*\"cotton\" + 0.028*\"area\" + 0.025*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:34:29,031 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.041*\"arsen\" + 0.039*\"line\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.013*\"gai\"\n", + "2019-01-31 00:34:29,032 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 
0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:34:29,033 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.041*\"american\" + 0.031*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.018*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:34:29,034 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.010*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"bewild\" + 0.005*\"litig\" + 0.004*\"dixi\" + 0.004*\"vision\" + 0.004*\"comic\" + 0.004*\"night\"\n", + "2019-01-31 00:34:29,040 : INFO : topic diff=0.007532, rho=0.042914\n", + "2019-01-31 00:34:29,254 : INFO : PROGRESS: pass 0, at document #1088000/4922894\n", + "2019-01-31 00:34:30,656 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:30,923 : INFO : topic #29 (0.020): 0.017*\"companhia\" + 0.011*\"million\" + 0.008*\"yawn\" + 0.008*\"bank\" + 0.008*\"market\" + 0.008*\"busi\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"function\" + 0.007*\"industri\"\n", + "2019-01-31 00:34:30,924 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"district\" + 0.009*\"gothic\"\n", + "2019-01-31 00:34:30,925 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 00:34:30,926 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.075*\"octob\" + 0.074*\"januari\" + 0.074*\"sens\" + 0.070*\"april\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.067*\"decatur\" + 0.066*\"august\" + 0.065*\"judici\"\n", + "2019-01-31 00:34:30,927 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.027*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 
0.021*\"event\" + 0.019*\"atheist\" + 0.019*\"alic\" + 0.017*\"rainfal\"\n", + "2019-01-31 00:34:30,933 : INFO : topic diff=0.005381, rho=0.042875\n", + "2019-01-31 00:34:31,098 : INFO : PROGRESS: pass 0, at document #1090000/4922894\n", + "2019-01-31 00:34:32,508 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:32,774 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.023*\"voluntari\" + 0.021*\"democrat\" + 0.021*\"member\" + 0.018*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.013*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:34:32,775 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.039*\"tortur\" + 0.028*\"cotton\" + 0.027*\"area\" + 0.025*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:34:32,777 : INFO : topic #29 (0.020): 0.017*\"companhia\" + 0.011*\"million\" + 0.008*\"yawn\" + 0.008*\"bank\" + 0.008*\"busi\" + 0.008*\"market\" + 0.008*\"govern\" + 0.008*\"start\" + 0.007*\"function\" + 0.007*\"industri\"\n", + "2019-01-31 00:34:32,778 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"bewild\" + 0.005*\"vision\" + 0.005*\"litig\" + 0.004*\"dixi\" + 0.004*\"comic\" + 0.004*\"septemb\"\n", + "2019-01-31 00:34:32,779 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"vol\" + 0.013*\"der\" + 0.009*\"jeremiah\" + 0.009*\"european\" + 0.009*\"europ\"\n", + "2019-01-31 00:34:32,785 : INFO : topic diff=0.006816, rho=0.042835\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:34:32,939 : INFO : PROGRESS: pass 0, at document #1092000/4922894\n", + "2019-01-31 00:34:34,316 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:34,582 : INFO : topic #24 (0.020): 0.042*\"book\" + 
0.034*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.011*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 00:34:34,584 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:34:34,585 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"folei\" + 0.023*\"crete\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:34:34,586 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:34:34,587 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"collector\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.017*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:34:34,593 : INFO : topic diff=0.007883, rho=0.042796\n", + "2019-01-31 00:34:34,748 : INFO : PROGRESS: pass 0, at document #1094000/4922894\n", + "2019-01-31 00:34:36,137 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:36,403 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.023*\"voluntari\" + 0.021*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.013*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:34:36,404 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.047*\"chilton\" + 0.023*\"hong\" + 0.023*\"korea\" + 0.023*\"kong\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:34:36,405 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 
0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"nicola\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.011*\"magazin\" + 0.011*\"collect\"\n", + "2019-01-31 00:34:36,406 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.010*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.008*\"candid\" + 0.008*\"encyclopedia\" + 0.008*\"produc\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:34:36,407 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"tourist\" + 0.022*\"wife\" + 0.019*\"champion\" + 0.017*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 00:34:36,413 : INFO : topic diff=0.006432, rho=0.042757\n", + "2019-01-31 00:34:36,571 : INFO : PROGRESS: pass 0, at document #1096000/4922894\n", + "2019-01-31 00:34:37,976 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:38,242 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.033*\"sovereignti\" + 0.032*\"rural\" + 0.024*\"personifi\" + 0.024*\"poison\" + 0.021*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.016*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:34:38,243 : INFO : topic #39 (0.020): 0.042*\"canada\" + 0.035*\"canadian\" + 0.019*\"toronto\" + 0.019*\"hoar\" + 0.016*\"ontario\" + 0.013*\"new\" + 0.013*\"hydrogen\" + 0.011*\"scientist\" + 0.011*\"taxpay\" + 0.011*\"misericordia\"\n", + "2019-01-31 00:34:38,244 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.024*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.012*\"refut\"\n", + "2019-01-31 00:34:38,245 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"folei\" + 0.023*\"crete\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:34:38,246 : INFO : topic #13 (0.020): 
0.028*\"australia\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:34:38,252 : INFO : topic diff=0.008384, rho=0.042718\n", + "2019-01-31 00:34:38,407 : INFO : PROGRESS: pass 0, at document #1098000/4922894\n", + "2019-01-31 00:34:39,784 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:40,051 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.025*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:34:40,053 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.034*\"cotton\" + 0.030*\"unionist\" + 0.030*\"american\" + 0.025*\"new\" + 0.014*\"warrior\" + 0.014*\"year\" + 0.013*\"terri\" + 0.013*\"california\" + 0.012*\"north\"\n", + "2019-01-31 00:34:40,054 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"deal\" + 0.004*\"help\"\n", + "2019-01-31 00:34:40,055 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.023*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"barber\"\n", + "2019-01-31 00:34:40,056 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:34:40,062 : INFO : topic diff=0.006874, rho=0.042679\n", + "2019-01-31 00:34:42,779 : INFO : -11.583 per-word bound, 3068.5 perplexity estimate based on a held-out corpus of 2000 documents with 563914 words\n", + "2019-01-31 00:34:42,780 : INFO : PROGRESS: pass 0, at document #1100000/4922894\n", + "2019-01-31 
00:34:44,178 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:44,445 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.012*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"student\"\n", + "2019-01-31 00:34:44,446 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.049*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.023*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:34:44,447 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.022*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.014*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:34:44,448 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.024*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:34:44,449 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"method\" + 0.006*\"measur\"\n", + "2019-01-31 00:34:44,455 : INFO : topic diff=0.007173, rho=0.042640\n", + "2019-01-31 00:34:44,612 : INFO : PROGRESS: pass 0, at document #1102000/4922894\n", + "2019-01-31 00:34:46,015 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:46,282 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.034*\"cotton\" + 0.030*\"unionist\" + 0.030*\"american\" + 0.025*\"new\" + 0.014*\"year\" + 0.014*\"warrior\" + 0.013*\"california\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:34:46,283 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 
0.017*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.012*\"women\"\n", + "2019-01-31 00:34:46,284 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.015*\"televis\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.011*\"muskoge\" + 0.011*\"tajikistan\" + 0.011*\"khalsa\" + 0.010*\"anglo\" + 0.010*\"sri\"\n", + "2019-01-31 00:34:46,285 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.033*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:34:46,286 : INFO : topic #16 (0.020): 0.044*\"king\" + 0.028*\"priest\" + 0.021*\"duke\" + 0.020*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.017*\"rotterdam\" + 0.014*\"count\" + 0.013*\"maria\" + 0.013*\"portugues\"\n", + "2019-01-31 00:34:46,292 : INFO : topic diff=0.007395, rho=0.042601\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:34:46,454 : INFO : PROGRESS: pass 0, at document #1104000/4922894\n", + "2019-01-31 00:34:47,886 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:48,152 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"strategist\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:34:48,154 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:34:48,155 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"acid\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:34:48,156 : INFO : topic #32 (0.020): 0.056*\"district\" + 
0.045*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.025*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:34:48,157 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:34:48,163 : INFO : topic diff=0.008300, rho=0.042563\n", + "2019-01-31 00:34:48,318 : INFO : PROGRESS: pass 0, at document #1106000/4922894\n", + "2019-01-31 00:34:49,706 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:49,971 : INFO : topic #31 (0.020): 0.062*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"player\" + 0.023*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:34:49,972 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.050*\"chilton\" + 0.023*\"hong\" + 0.023*\"korea\" + 0.023*\"kong\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.015*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:34:49,973 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.034*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"personifi\" + 0.023*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.016*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:34:49,974 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:34:49,975 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.015*\"treeless\" + 0.015*\"norwai\" + 0.015*\"sweden\" + 0.015*\"damag\" + 0.014*\"swedish\" + 0.014*\"huntsvil\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.011*\"replac\"\n", + "2019-01-31 00:34:49,981 : INFO : topic diff=0.007876, rho=0.042524\n", + 
"2019-01-31 00:34:50,136 : INFO : PROGRESS: pass 0, at document #1108000/4922894\n", + "2019-01-31 00:34:51,505 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:51,771 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"form\" + 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"charact\" + 0.006*\"trade\"\n", + "2019-01-31 00:34:51,772 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"develop\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"student\"\n", + "2019-01-31 00:34:51,774 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"deal\" + 0.004*\"man\"\n", + "2019-01-31 00:34:51,775 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"strategist\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:34:51,776 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.013*\"aza\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.008*\"till\" + 0.007*\"king\" + 0.007*\"armi\" + 0.006*\"centuri\"\n", + "2019-01-31 00:34:51,782 : INFO : topic diff=0.006043, rho=0.042486\n", + "2019-01-31 00:34:51,936 : INFO : PROGRESS: pass 0, at document #1110000/4922894\n", + "2019-01-31 00:34:53,315 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:53,581 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:34:53,582 : INFO : topic #6 (0.020): 0.071*\"fewer\" 
+ 0.025*\"septemb\" + 0.024*\"epiru\" + 0.019*\"teacher\" + 0.018*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:34:53,584 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"form\" + 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.007*\"charact\" + 0.006*\"trade\"\n", + "2019-01-31 00:34:53,585 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.028*\"germani\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.009*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:34:53,586 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.012*\"refut\"\n", + "2019-01-31 00:34:53,592 : INFO : topic diff=0.006477, rho=0.042448\n", + "2019-01-31 00:34:53,747 : INFO : PROGRESS: pass 0, at document #1112000/4922894\n", + "2019-01-31 00:34:55,142 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:55,408 : INFO : topic #9 (0.020): 0.065*\"bone\" + 0.041*\"american\" + 0.032*\"valour\" + 0.021*\"dutch\" + 0.018*\"english\" + 0.018*\"player\" + 0.017*\"folei\" + 0.015*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:34:55,410 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"septemb\" + 0.024*\"epiru\" + 0.019*\"teacher\" + 0.018*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:34:55,411 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.043*\"popolo\" + 0.040*\"tortur\" + 0.028*\"area\" + 0.026*\"cotton\" + 0.025*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:34:55,412 : INFO : topic #22 (0.020): 0.033*\"spars\" + 
0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.015*\"hostil\" + 0.014*\"male\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:34:55,413 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:34:55,419 : INFO : topic diff=0.006224, rho=0.042409\n", + "2019-01-31 00:34:55,571 : INFO : PROGRESS: pass 0, at document #1114000/4922894\n", + "2019-01-31 00:34:56,950 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:34:57,216 : INFO : topic #29 (0.020): 0.018*\"companhia\" + 0.011*\"million\" + 0.008*\"busi\" + 0.008*\"yawn\" + 0.008*\"bank\" + 0.008*\"market\" + 0.008*\"govern\" + 0.007*\"start\" + 0.007*\"industri\" + 0.007*\"function\"\n", + "2019-01-31 00:34:57,217 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.023*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:34:57,218 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.034*\"cotton\" + 0.030*\"unionist\" + 0.029*\"american\" + 0.025*\"new\" + 0.014*\"year\" + 0.013*\"warrior\" + 0.013*\"california\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:34:57,219 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.009*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:34:57,220 : INFO : topic #45 (0.020): 0.022*\"jpg\" + 0.021*\"fifteenth\" + 0.016*\"illicit\" + 0.015*\"colder\" + 0.015*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:34:57,226 : INFO : topic diff=0.006855, 
rho=0.042371\n", + "2019-01-31 00:34:57,378 : INFO : PROGRESS: pass 0, at document #1116000/4922894\n", + "2019-01-31 00:34:58,752 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:34:59,018 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"carlo\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.011*\"lizard\"\n", + "2019-01-31 00:34:59,019 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.049*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.024*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:34:59,020 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.043*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:34:59,021 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.040*\"arsen\" + 0.039*\"line\" + 0.036*\"raid\" + 0.029*\"museo\" + 0.023*\"pain\" + 0.018*\"traceabl\" + 0.017*\"serv\" + 0.013*\"exhaust\" + 0.013*\"gai\"\n", + "2019-01-31 00:34:59,022 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.021*\"nation\" + 0.020*\"serv\" + 0.019*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.017*\"seri\" + 0.015*\"appeas\"\n", + "2019-01-31 00:34:59,028 : INFO : topic diff=0.007364, rho=0.042333\n", + "2019-01-31 00:34:59,242 : INFO : PROGRESS: pass 0, at document #1118000/4922894\n", + "2019-01-31 00:35:00,659 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:00,925 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 
00:35:00,927 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.008*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:35:00,928 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\" + 0.011*\"lizard\"\n", + "2019-01-31 00:35:00,929 : INFO : topic #16 (0.020): 0.045*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.020*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.017*\"rotterdam\" + 0.014*\"portugues\" + 0.014*\"count\" + 0.013*\"maria\"\n", + "2019-01-31 00:35:00,930 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"comic\" + 0.005*\"litig\" + 0.005*\"vision\" + 0.005*\"bewild\" + 0.004*\"septemb\" + 0.004*\"black\"\n", + "2019-01-31 00:35:00,936 : INFO : topic diff=0.006929, rho=0.042295\n", + "2019-01-31 00:35:03,682 : INFO : -11.629 per-word bound, 3166.4 perplexity estimate based on a held-out corpus of 2000 documents with 566734 words\n", + "2019-01-31 00:35:03,682 : INFO : PROGRESS: pass 0, at document #1120000/4922894\n", + "2019-01-31 00:35:05,087 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:05,354 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"class\" + 0.010*\"nativist\" + 0.010*\"coalit\" + 0.009*\"sai\"\n", + "2019-01-31 00:35:05,355 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.031*\"new\" + 0.023*\"palmer\" + 0.014*\"year\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"hot\" + 0.010*\"lobe\"\n", + "2019-01-31 00:35:05,357 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.030*\"champion\" + 0.027*\"woman\" + 
0.027*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.017*\"rainfal\" + 0.017*\"alic\"\n", + "2019-01-31 00:35:05,358 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.033*\"cotton\" + 0.030*\"unionist\" + 0.029*\"american\" + 0.026*\"new\" + 0.014*\"year\" + 0.014*\"warrior\" + 0.013*\"california\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:35:05,359 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.019*\"norwai\" + 0.016*\"norwegian\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.013*\"treeless\" + 0.013*\"wind\" + 0.012*\"huntsvil\" + 0.012*\"financ\"\n", + "2019-01-31 00:35:05,365 : INFO : topic diff=0.006813, rho=0.042258\n", + "2019-01-31 00:35:05,526 : INFO : PROGRESS: pass 0, at document #1122000/4922894\n", + "2019-01-31 00:35:06,945 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:07,211 : INFO : topic #15 (0.020): 0.012*\"develop\" + 0.012*\"small\" + 0.011*\"organ\" + 0.011*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 00:35:07,212 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.016*\"olympo\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:35:07,213 : INFO : topic #46 (0.020): 0.020*\"norwai\" + 0.019*\"stop\" + 0.017*\"norwegian\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.014*\"treeless\" + 0.014*\"damag\" + 0.013*\"wind\" + 0.012*\"huntsvil\" + 0.011*\"financ\"\n", + "2019-01-31 00:35:07,214 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.018*\"muscl\" + 0.017*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:35:07,215 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 
0.020*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"militari\" + 0.013*\"unionist\" + 0.012*\"refut\" + 0.012*\"airbu\"\n", + "2019-01-31 00:35:07,221 : INFO : topic diff=0.007671, rho=0.042220\n", + "2019-01-31 00:35:07,379 : INFO : PROGRESS: pass 0, at document #1124000/4922894\n", + "2019-01-31 00:35:08,788 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:09,054 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.008*\"have\" + 0.007*\"treat\" + 0.007*\"proper\" + 0.006*\"caus\" + 0.006*\"acid\" + 0.006*\"gastrointestin\"\n", + "2019-01-31 00:35:09,055 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.042*\"american\" + 0.032*\"valour\" + 0.021*\"dutch\" + 0.018*\"english\" + 0.017*\"folei\" + 0.017*\"player\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:35:09,056 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:35:09,057 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.005*\"blue\" + 0.005*\"comic\" + 0.005*\"litig\" + 0.004*\"vision\" + 0.004*\"bewild\" + 0.004*\"septemb\" + 0.004*\"black\"\n", + "2019-01-31 00:35:09,059 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.035*\"sovereignti\" + 0.031*\"rural\" + 0.030*\"rsm\" + 0.026*\"personifi\" + 0.023*\"poison\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.016*\"unfortun\"\n", + "2019-01-31 00:35:09,064 : INFO : topic diff=0.008978, rho=0.042182\n", + "2019-01-31 00:35:09,221 : INFO : PROGRESS: pass 0, at document #1126000/4922894\n", + "2019-01-31 00:35:10,630 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:10,896 : INFO : topic #29 (0.020): 0.018*\"companhia\" + 0.010*\"million\" + 
0.009*\"bank\" + 0.009*\"busi\" + 0.008*\"market\" + 0.008*\"yawn\" + 0.008*\"govern\" + 0.007*\"start\" + 0.007*\"industri\" + 0.007*\"function\"\n", + "2019-01-31 00:35:10,898 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.028*\"area\" + 0.026*\"cotton\" + 0.024*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:35:10,899 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.026*\"septemb\" + 0.025*\"epiru\" + 0.019*\"teacher\" + 0.018*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:35:10,900 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:35:10,901 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.013*\"aza\" + 0.009*\"battalion\" + 0.009*\"teufel\" + 0.008*\"forc\" + 0.008*\"till\" + 0.008*\"king\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"centuri\"\n", + "2019-01-31 00:35:10,907 : INFO : topic diff=0.006269, rho=0.042145\n", + "2019-01-31 00:35:11,062 : INFO : PROGRESS: pass 0, at document #1128000/4922894\n", + "2019-01-31 00:35:12,460 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:12,727 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.026*\"septemb\" + 0.025*\"epiru\" + 0.019*\"teacher\" + 0.018*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:35:12,728 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:35:12,729 : INFO : topic 
#41 (0.020): 0.044*\"citi\" + 0.031*\"new\" + 0.024*\"palmer\" + 0.014*\"year\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"hot\" + 0.010*\"lobe\"\n", + "2019-01-31 00:35:12,730 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.023*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:35:12,731 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:35:12,737 : INFO : topic diff=0.007026, rho=0.042108\n", + "2019-01-31 00:35:12,890 : INFO : PROGRESS: pass 0, at document #1130000/4922894\n", + "2019-01-31 00:35:14,274 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:14,541 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"sens\" + 0.074*\"octob\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.067*\"april\" + 0.066*\"juli\" + 0.066*\"judici\" + 0.066*\"decatur\" + 0.065*\"august\"\n", + "2019-01-31 00:35:14,542 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.020*\"serv\" + 0.020*\"govern\" + 0.019*\"member\" + 0.017*\"gener\" + 0.017*\"seri\" + 0.014*\"appeas\"\n", + "2019-01-31 00:35:14,543 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"class\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\"\n", + "2019-01-31 00:35:14,544 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.041*\"tortur\" + 0.028*\"area\" + 0.027*\"cotton\" + 0.024*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:35:14,545 : INFO : topic #13 (0.020): 0.025*\"sourc\" + 
0.025*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.022*\"australian\" + 0.020*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"ipa\"\n", + "2019-01-31 00:35:14,551 : INFO : topic diff=0.007217, rho=0.042070\n", + "2019-01-31 00:35:14,702 : INFO : PROGRESS: pass 0, at document #1132000/4922894\n", + "2019-01-31 00:35:16,063 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:16,330 : INFO : topic #16 (0.020): 0.046*\"king\" + 0.031*\"priest\" + 0.021*\"grammat\" + 0.019*\"duke\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.017*\"rotterdam\" + 0.014*\"portugues\" + 0.014*\"count\" + 0.013*\"maria\"\n", + "2019-01-31 00:35:16,331 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.039*\"line\" + 0.037*\"raid\" + 0.037*\"arsen\" + 0.028*\"museo\" + 0.020*\"pain\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.013*\"exhaust\" + 0.012*\"gai\"\n", + "2019-01-31 00:35:16,332 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:35:16,333 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.009*\"veget\" + 0.007*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:35:16,334 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.043*\"american\" + 0.031*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"player\" + 0.017*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:35:16,340 : INFO : topic diff=0.006899, rho=0.042033\n", + "2019-01-31 00:35:16,499 : INFO : PROGRESS: pass 0, at document #1134000/4922894\n", + "2019-01-31 00:35:17,931 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:18,197 : INFO : topic 
#45 (0.020): 0.022*\"jpg\" + 0.021*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.015*\"black\" + 0.012*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:35:18,199 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"man\"\n", + "2019-01-31 00:35:18,200 : INFO : topic #13 (0.020): 0.025*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"australian\" + 0.020*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"ipa\"\n", + "2019-01-31 00:35:18,201 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.020*\"serv\" + 0.019*\"member\" + 0.017*\"gener\" + 0.017*\"seri\" + 0.014*\"appeas\"\n", + "2019-01-31 00:35:18,202 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.039*\"line\" + 0.037*\"raid\" + 0.037*\"arsen\" + 0.028*\"museo\" + 0.020*\"pain\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.013*\"exhaust\" + 0.012*\"gai\"\n", + "2019-01-31 00:35:18,208 : INFO : topic diff=0.007484, rho=0.041996\n", + "2019-01-31 00:35:18,364 : INFO : PROGRESS: pass 0, at document #1136000/4922894\n", + "2019-01-31 00:35:19,774 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:20,040 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.016*\"jewish\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.009*\"european\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:35:20,041 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"australian\" + 0.021*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:35:20,042 : INFO : topic #40 (0.020): 0.089*\"unit\" + 
0.026*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.017*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:35:20,043 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"like\" + 0.007*\"charact\" + 0.007*\"uruguayan\" + 0.006*\"known\"\n", + "2019-01-31 00:35:20,044 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.014*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:35:20,050 : INFO : topic diff=0.006667, rho=0.041959\n", + "2019-01-31 00:35:20,206 : INFO : PROGRESS: pass 0, at document #1138000/4922894\n", + "2019-01-31 00:35:21,598 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:21,864 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.040*\"rural\" + 0.036*\"sovereignti\" + 0.026*\"personifi\" + 0.023*\"rsm\" + 0.022*\"poison\" + 0.021*\"reprint\" + 0.019*\"moscow\" + 0.015*\"unfortun\" + 0.015*\"poland\"\n", + "2019-01-31 00:35:21,865 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"taxpay\" + 0.017*\"champion\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:35:21,866 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"player\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:35:21,867 : INFO : topic #29 (0.020): 0.018*\"companhia\" + 0.010*\"million\" + 0.010*\"bank\" + 0.008*\"busi\" + 0.008*\"market\" + 0.008*\"yawn\" + 0.007*\"govern\" + 0.007*\"start\" + 0.007*\"industri\" + 0.007*\"function\"\n", + "2019-01-31 00:35:21,868 : INFO : topic #47 (0.020): 
0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.015*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:35:21,874 : INFO : topic diff=0.009771, rho=0.041922\n", + "2019-01-31 00:35:24,538 : INFO : -11.660 per-word bound, 3235.1 perplexity estimate based on a held-out corpus of 2000 documents with 541570 words\n", + "2019-01-31 00:35:24,539 : INFO : PROGRESS: pass 0, at document #1140000/4922894\n", + "2019-01-31 00:35:25,931 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:26,197 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.031*\"new\" + 0.023*\"palmer\" + 0.014*\"year\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 00:35:26,198 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"televis\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.011*\"khalsa\" + 0.011*\"tajikistan\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"alam\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:35:26,200 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.013*\"aza\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.007*\"king\" + 0.007*\"till\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"centuri\"\n", + "2019-01-31 00:35:26,201 : INFO : topic #29 (0.020): 0.018*\"companhia\" + 0.010*\"million\" + 0.009*\"bank\" + 0.009*\"busi\" + 0.008*\"market\" + 0.008*\"yawn\" + 0.007*\"govern\" + 0.007*\"industri\" + 0.007*\"start\" + 0.007*\"function\"\n", + "2019-01-31 00:35:26,202 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.015*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:35:26,208 : INFO : topic diff=0.006620, rho=0.041885\n", + 
"2019-01-31 00:35:26,363 : INFO : PROGRESS: pass 0, at document #1142000/4922894\n", + "2019-01-31 00:35:27,746 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:28,012 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.025*\"men\" + 0.021*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.018*\"alic\" + 0.017*\"rainfal\"\n", + "2019-01-31 00:35:28,013 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.040*\"tortur\" + 0.028*\"area\" + 0.026*\"cotton\" + 0.024*\"regim\" + 0.024*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:35:28,014 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"constitut\" + 0.010*\"briarwood\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"silicon\"\n", + "2019-01-31 00:35:28,016 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 0.008*\"number\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.007*\"servitud\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"method\"\n", + "2019-01-31 00:35:28,017 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"develop\"\n", + "2019-01-31 00:35:28,022 : INFO : topic diff=0.006957, rho=0.041849\n", + "2019-01-31 00:35:28,183 : INFO : PROGRESS: pass 0, at document #1144000/4922894\n", + "2019-01-31 00:35:29,579 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:29,849 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.023*\"voluntari\" + 0.022*\"member\" + 0.021*\"democrat\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"liber\" + 0.013*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 00:35:29,850 : INFO : 
topic #35 (0.020): 0.055*\"russia\" + 0.039*\"rural\" + 0.035*\"sovereignti\" + 0.026*\"personifi\" + 0.023*\"poison\" + 0.021*\"reprint\" + 0.020*\"rsm\" + 0.020*\"moscow\" + 0.015*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:35:29,851 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.010*\"origin\" + 0.009*\"centuri\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.006*\"known\"\n", + "2019-01-31 00:35:29,852 : INFO : topic #12 (0.020): 0.009*\"frontal\" + 0.008*\"number\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.007*\"servitud\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"method\"\n", + "2019-01-31 00:35:29,853 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"televis\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.011*\"khalsa\" + 0.011*\"tajikistan\" + 0.010*\"anglo\" + 0.010*\"singh\" + 0.010*\"muskoge\"\n", + "2019-01-31 00:35:29,859 : INFO : topic diff=0.006565, rho=0.041812\n", + "2019-01-31 00:35:30,014 : INFO : PROGRESS: pass 0, at document #1146000/4922894\n", + "2019-01-31 00:35:31,404 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:31,671 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"televis\" + 0.014*\"pakistan\" + 0.011*\"islam\" + 0.011*\"khalsa\" + 0.010*\"tajikistan\" + 0.010*\"anglo\" + 0.010*\"singh\" + 0.010*\"alam\"\n", + "2019-01-31 00:35:31,673 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"form\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.010*\"centuri\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.006*\"trade\"\n", + "2019-01-31 00:35:31,674 : INFO : topic #41 (0.020): 0.045*\"citi\" + 0.031*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.014*\"year\" + 0.012*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 00:35:31,675 : 
INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"man\"\n", + "2019-01-31 00:35:31,676 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.020*\"teacher\" + 0.018*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:35:31,682 : INFO : topic diff=0.007417, rho=0.041776\n", + "2019-01-31 00:35:31,842 : INFO : PROGRESS: pass 0, at document #1148000/4922894\n", + "2019-01-31 00:35:33,262 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:33,529 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.012*\"pop\" + 0.011*\"prognosi\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"cytokin\" + 0.008*\"brio\" + 0.007*\"base\" + 0.007*\"softwar\" + 0.007*\"championship\"\n", + "2019-01-31 00:35:33,530 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:35:33,531 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.024*\"scientist\" + 0.023*\"player\" + 0.023*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:35:33,532 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.034*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.015*\"lazi\" + 0.014*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:35:33,533 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.012*\"lizard\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"carlo\"\n", + "2019-01-31 00:35:33,539 : INFO : topic 
diff=0.006646, rho=0.041739\n", + "2019-01-31 00:35:33,752 : INFO : PROGRESS: pass 0, at document #1150000/4922894\n", + "2019-01-31 00:35:35,186 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:35,452 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:35:35,453 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.022*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"land\" + 0.008*\"foam\"\n", + "2019-01-31 00:35:35,454 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.019*\"buford\" + 0.013*\"histor\" + 0.011*\"linear\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:35:35,455 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.037*\"rural\" + 0.034*\"sovereignti\" + 0.025*\"personifi\" + 0.023*\"poison\" + 0.021*\"reprint\" + 0.019*\"moscow\" + 0.018*\"rsm\" + 0.015*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:35:35,456 : INFO : topic #29 (0.020): 0.019*\"companhia\" + 0.011*\"million\" + 0.010*\"bank\" + 0.009*\"busi\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.007*\"govern\" + 0.007*\"industri\" + 0.007*\"start\" + 0.007*\"function\"\n", + "2019-01-31 00:35:35,463 : INFO : topic diff=0.007564, rho=0.041703\n", + "2019-01-31 00:35:35,615 : INFO : PROGRESS: pass 0, at document #1152000/4922894\n", + "2019-01-31 00:35:36,991 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:37,257 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.010*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 
00:35:37,258 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"have\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"treat\" + 0.007*\"caus\" + 0.006*\"hormon\" + 0.006*\"acid\" + 0.006*\"proper\"\n", + "2019-01-31 00:35:37,259 : INFO : topic #29 (0.020): 0.019*\"companhia\" + 0.011*\"million\" + 0.009*\"bank\" + 0.009*\"busi\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.007*\"govern\" + 0.007*\"industri\" + 0.007*\"start\" + 0.007*\"function\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:35:37,260 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:35:37,261 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.012*\"lizard\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"carlo\"\n", + "2019-01-31 00:35:37,267 : INFO : topic diff=0.006275, rho=0.041667\n", + "2019-01-31 00:35:37,428 : INFO : PROGRESS: pass 0, at document #1154000/4922894\n", + "2019-01-31 00:35:38,853 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:39,119 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.017*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:35:39,120 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.021*\"cathol\" + 0.020*\"christian\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:35:39,122 : INFO : topic #15 (0.020): 0.011*\"develop\" + 0.011*\"small\" + 0.011*\"commun\" + 0.011*\"organ\" + 0.009*\"word\" + 0.009*\"cultur\" + 0.008*\"group\" + 0.008*\"peopl\" + 
0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:35:39,123 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"centuri\" + 0.010*\"form\" + 0.010*\"origin\" + 0.009*\"woodcut\" + 0.008*\"mean\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.007*\"charact\" + 0.006*\"trade\"\n", + "2019-01-31 00:35:39,124 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.005*\"bewild\" + 0.005*\"comic\" + 0.005*\"vision\" + 0.004*\"septemb\" + 0.004*\"litig\" + 0.004*\"dixi\"\n", + "2019-01-31 00:35:39,130 : INFO : topic diff=0.007083, rho=0.041631\n", + "2019-01-31 00:35:39,281 : INFO : PROGRESS: pass 0, at document #1156000/4922894\n", + "2019-01-31 00:35:40,654 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:40,920 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:35:40,921 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:35:40,922 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.031*\"new\" + 0.022*\"palmer\" + 0.014*\"year\" + 0.013*\"strategist\" + 0.013*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 00:35:40,923 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:35:40,924 : INFO : topic #16 (0.020): 0.045*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.018*\"quarterli\" + 0.018*\"duke\" + 0.017*\"idiosyncrat\" + 0.017*\"rotterdam\" + 0.015*\"count\" + 0.013*\"brazil\" + 
0.012*\"portugues\"\n", + "2019-01-31 00:35:40,930 : INFO : topic diff=0.007047, rho=0.041595\n", + "2019-01-31 00:35:41,082 : INFO : PROGRESS: pass 0, at document #1158000/4922894\n", + "2019-01-31 00:35:42,471 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:42,737 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.077*\"octob\" + 0.072*\"januari\" + 0.071*\"notion\" + 0.069*\"juli\" + 0.067*\"judici\" + 0.067*\"august\" + 0.067*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 00:35:42,739 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.021*\"member\" + 0.021*\"democrat\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.014*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 00:35:42,740 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"live\" + 0.010*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:35:42,741 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.037*\"rural\" + 0.034*\"sovereignti\" + 0.026*\"personifi\" + 0.022*\"poison\" + 0.021*\"reprint\" + 0.019*\"moscow\" + 0.016*\"unfortun\" + 0.015*\"rsm\" + 0.015*\"poland\"\n", + "2019-01-31 00:35:42,742 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.021*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 00:35:42,748 : INFO : topic diff=0.005839, rho=0.041559\n", + "2019-01-31 00:35:45,468 : INFO : -12.230 per-word bound, 4804.3 perplexity estimate based on a held-out corpus of 2000 documents with 589084 words\n", + "2019-01-31 00:35:45,469 : INFO : PROGRESS: pass 0, at document #1160000/4922894\n", + "2019-01-31 00:35:46,869 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:47,135 : INFO : topic #24 (0.020): 
0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:35:47,136 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"blue\" + 0.005*\"vision\" + 0.005*\"bewild\" + 0.005*\"comic\" + 0.004*\"septemb\" + 0.004*\"litig\" + 0.004*\"dixi\"\n", + "2019-01-31 00:35:47,137 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.030*\"new\" + 0.023*\"palmer\" + 0.013*\"strategist\" + 0.013*\"year\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 00:35:47,139 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:35:47,140 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:35:47,146 : INFO : topic diff=0.008513, rho=0.041523\n", + "2019-01-31 00:35:47,300 : INFO : PROGRESS: pass 0, at document #1162000/4922894\n", + "2019-01-31 00:35:48,692 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:48,958 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"man\"\n", + "2019-01-31 00:35:48,959 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"taxpay\" + 0.017*\"champion\" + 0.015*\"chamber\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.012*\"winner\"\n", + "2019-01-31 00:35:48,960 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 
0.007*\"gestur\" + 0.006*\"blue\" + 0.005*\"vision\" + 0.005*\"bewild\" + 0.005*\"comic\" + 0.004*\"septemb\" + 0.004*\"litig\" + 0.004*\"dixi\"\n", + "2019-01-31 00:35:48,961 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"minist\" + 0.026*\"offic\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.018*\"serv\" + 0.016*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:35:48,962 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:35:48,968 : INFO : topic diff=0.006946, rho=0.041487\n", + "2019-01-31 00:35:49,120 : INFO : PROGRESS: pass 0, at document #1164000/4922894\n", + "2019-01-31 00:35:50,492 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:50,759 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:35:50,760 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:35:50,761 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.037*\"rural\" + 0.034*\"sovereignti\" + 0.026*\"personifi\" + 0.022*\"poison\" + 0.021*\"reprint\" + 0.019*\"moscow\" + 0.015*\"unfortun\" + 0.015*\"poland\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:35:50,762 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:35:50,763 : INFO : topic #0 
(0.020): 0.071*\"statewid\" + 0.042*\"raid\" + 0.039*\"arsen\" + 0.038*\"line\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.017*\"pain\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:35:50,769 : INFO : topic diff=0.006318, rho=0.041451\n", + "2019-01-31 00:35:50,921 : INFO : PROGRESS: pass 0, at document #1166000/4922894\n", + "2019-01-31 00:35:52,301 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:52,567 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.046*\"vigour\" + 0.043*\"popolo\" + 0.041*\"tortur\" + 0.028*\"cotton\" + 0.028*\"area\" + 0.024*\"regim\" + 0.024*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:35:52,568 : INFO : topic #36 (0.020): 0.013*\"network\" + 0.011*\"pop\" + 0.010*\"oper\" + 0.010*\"prognosi\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"cytokin\" + 0.007*\"base\" + 0.007*\"brio\" + 0.007*\"softwar\"\n", + "2019-01-31 00:35:52,569 : INFO : topic #28 (0.020): 0.029*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.019*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:35:52,571 : INFO : topic #11 (0.020): 0.028*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"rival\" + 0.011*\"david\" + 0.010*\"georg\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:35:52,572 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.029*\"germani\" + 0.015*\"jewish\" + 0.015*\"vol\" + 0.013*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:35:52,577 : INFO : topic diff=0.007075, rho=0.041416\n", + "2019-01-31 00:35:52,733 : INFO : PROGRESS: pass 0, at document #1168000/4922894\n", + "2019-01-31 00:35:54,135 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:54,401 : INFO : 
topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"london\" + 0.024*\"new\" + 0.023*\"australian\" + 0.021*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"rotterdam\" + 0.015*\"youth\"\n", + "2019-01-31 00:35:54,402 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.020*\"mexico\" + 0.018*\"del\" + 0.016*\"soviet\" + 0.012*\"santa\" + 0.012*\"lizard\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.010*\"carlo\"\n", + "2019-01-31 00:35:54,404 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:35:54,405 : INFO : topic #39 (0.020): 0.046*\"canada\" + 0.037*\"canadian\" + 0.020*\"toronto\" + 0.019*\"ontario\" + 0.019*\"hoar\" + 0.013*\"new\" + 0.012*\"hydrogen\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.011*\"araz\"\n", + "2019-01-31 00:35:54,406 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.027*\"minist\" + 0.027*\"offic\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.014*\"start\"\n", + "2019-01-31 00:35:54,412 : INFO : topic diff=0.005852, rho=0.041380\n", + "2019-01-31 00:35:54,567 : INFO : PROGRESS: pass 0, at document #1170000/4922894\n", + "2019-01-31 00:35:55,946 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:56,212 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.029*\"incumb\" + 0.015*\"islam\" + 0.013*\"televis\" + 0.013*\"pakistan\" + 0.012*\"muskoge\" + 0.011*\"khalsa\" + 0.010*\"alam\" + 0.010*\"tajikistan\" + 0.010*\"anglo\"\n", + "2019-01-31 00:35:56,213 : INFO : topic #16 (0.020): 0.046*\"king\" + 0.032*\"priest\" + 0.019*\"grammat\" + 0.019*\"quarterli\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.015*\"brazil\" + 0.014*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 
00:35:56,215 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.033*\"cotton\" + 0.033*\"unionist\" + 0.029*\"american\" + 0.026*\"new\" + 0.014*\"year\" + 0.013*\"warrior\" + 0.013*\"california\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:35:56,216 : INFO : topic #15 (0.020): 0.011*\"develop\" + 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:35:56,217 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.032*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.020*\"women\" + 0.020*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:35:56,223 : INFO : topic diff=0.006069, rho=0.041345\n", + "2019-01-31 00:35:56,379 : INFO : PROGRESS: pass 0, at document #1172000/4922894\n", + "2019-01-31 00:35:57,766 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:58,032 : INFO : topic #2 (0.020): 0.044*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.011*\"pope\" + 0.010*\"bahá\" + 0.009*\"class\" + 0.009*\"coalit\"\n", + "2019-01-31 00:35:58,033 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"australian\" + 0.021*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.015*\"rotterdam\"\n", + "2019-01-31 00:35:58,034 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.021*\"mexico\" + 0.019*\"del\" + 0.016*\"soviet\" + 0.012*\"lizard\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.010*\"carlo\"\n", + "2019-01-31 00:35:58,035 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.010*\"oper\" + 0.009*\"develop\" + 0.008*\"serv\" + 0.008*\"cytokin\" + 0.008*\"base\" + 0.007*\"softwar\" + 0.007*\"user\"\n", + "2019-01-31 00:35:58,037 : INFO 
: topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.015*\"jewish\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:35:58,042 : INFO : topic diff=0.006696, rho=0.041310\n", + "2019-01-31 00:35:58,198 : INFO : PROGRESS: pass 0, at document #1174000/4922894\n", + "2019-01-31 00:35:59,595 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:35:59,861 : INFO : topic #39 (0.020): 0.046*\"canada\" + 0.036*\"canadian\" + 0.020*\"toronto\" + 0.019*\"ontario\" + 0.018*\"hoar\" + 0.013*\"new\" + 0.012*\"hydrogen\" + 0.012*\"araz\" + 0.011*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:35:59,862 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 00:35:59,863 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.013*\"strategist\" + 0.013*\"year\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:35:59,864 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"rival\" + 0.011*\"david\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:35:59,865 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"norwai\" + 0.017*\"norwegian\" + 0.016*\"swedish\" + 0.015*\"sweden\" + 0.015*\"unjust\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.011*\"financ\" + 0.011*\"treeless\"\n", + "2019-01-31 00:35:59,871 : INFO : topic diff=0.007020, rho=0.041274\n", + "2019-01-31 00:36:00,027 : INFO : PROGRESS: pass 0, at document #1176000/4922894\n", + "2019-01-31 00:36:01,413 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:36:01,680 : INFO : topic #2 (0.020): 0.044*\"isl\" + 0.036*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.011*\"pope\" + 0.010*\"bahá\" + 0.010*\"class\" + 0.009*\"coalit\"\n", + "2019-01-31 00:36:01,681 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"norwai\" + 0.017*\"norwegian\" + 0.015*\"swedish\" + 0.015*\"sweden\" + 0.015*\"damag\" + 0.014*\"unjust\" + 0.014*\"wind\" + 0.011*\"turkish\" + 0.011*\"financ\"\n", + "2019-01-31 00:36:01,682 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.015*\"jewish\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:36:01,683 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:36:01,684 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:36:01,690 : INFO : topic diff=0.005963, rho=0.041239\n", + "2019-01-31 00:36:01,847 : INFO : PROGRESS: pass 0, at document #1178000/4922894\n", + "2019-01-31 00:36:03,242 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:03,509 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"norwai\" + 0.017*\"norwegian\" + 0.016*\"swedish\" + 0.015*\"sweden\" + 0.015*\"damag\" + 0.015*\"wind\" + 0.014*\"unjust\" + 0.011*\"turkish\" + 0.011*\"denmark\"\n", + "2019-01-31 00:36:03,511 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 
0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:36:03,512 : INFO : topic #29 (0.020): 0.020*\"companhia\" + 0.011*\"million\" + 0.009*\"bank\" + 0.009*\"market\" + 0.009*\"busi\" + 0.008*\"yawn\" + 0.007*\"industri\" + 0.007*\"start\" + 0.007*\"produc\" + 0.007*\"govern\"\n", + "2019-01-31 00:36:03,513 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.033*\"pari\" + 0.024*\"jean\" + 0.024*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:36:03,514 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.024*\"new\" + 0.022*\"australian\" + 0.021*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.015*\"rotterdam\"\n", + "2019-01-31 00:36:03,520 : INFO : topic diff=0.007834, rho=0.041204\n", + "2019-01-31 00:36:06,233 : INFO : -11.496 per-word bound, 2888.2 perplexity estimate based on a held-out corpus of 2000 documents with 539919 words\n", + "2019-01-31 00:36:06,234 : INFO : PROGRESS: pass 0, at document #1180000/4922894\n", + "2019-01-31 00:36:07,638 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:07,904 : INFO : topic #45 (0.020): 0.022*\"jpg\" + 0.022*\"fifteenth\" + 0.016*\"illicit\" + 0.016*\"black\" + 0.016*\"colder\" + 0.015*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:36:07,905 : INFO : topic #19 (0.020): 0.013*\"languag\" + 0.010*\"woodcut\" + 0.010*\"centuri\" + 0.010*\"form\" + 0.010*\"origin\" + 0.008*\"mean\" + 0.007*\"like\" + 0.007*\"charact\" + 0.007*\"uruguayan\" + 0.007*\"trade\"\n", + "2019-01-31 00:36:07,906 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.037*\"sovereignti\" + 0.036*\"rural\" + 0.027*\"personifi\" + 0.022*\"poison\" + 0.021*\"reprint\" + 0.021*\"moscow\" + 0.016*\"unfortun\" + 0.016*\"malaysia\" + 0.015*\"poland\"\n", + "2019-01-31 00:36:07,907 : INFO : 
topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"king\" + 0.006*\"militari\"\n", + "2019-01-31 00:36:07,908 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:36:07,914 : INFO : topic diff=0.007236, rho=0.041169\n", + "2019-01-31 00:36:08,069 : INFO : PROGRESS: pass 0, at document #1182000/4922894\n", + "2019-01-31 00:36:09,458 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:09,725 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"adulthood\" + 0.024*\"factor\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"yawn\"\n", + "2019-01-31 00:36:09,726 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.034*\"pari\" + 0.024*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:36:09,727 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.012*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:36:09,728 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.014*\"tornado\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"horac\" + 0.011*\"ret\" + 0.010*\"théori\"\n", + "2019-01-31 00:36:09,729 : INFO : topic #0 (0.020): 0.071*\"statewid\" + 0.041*\"raid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.028*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.016*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:36:09,735 : INFO : topic diff=0.005971, rho=0.041135\n", + 
"2019-01-31 00:36:09,950 : INFO : PROGRESS: pass 0, at document #1184000/4922894\n", + "2019-01-31 00:36:11,352 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:11,618 : INFO : topic #48 (0.020): 0.079*\"octob\" + 0.075*\"march\" + 0.075*\"sens\" + 0.070*\"notion\" + 0.070*\"januari\" + 0.067*\"juli\" + 0.065*\"august\" + 0.065*\"april\" + 0.064*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 00:36:11,619 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.049*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.023*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"shirin\" + 0.013*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 00:36:11,621 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.033*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:36:11,621 : INFO : topic #16 (0.020): 0.047*\"king\" + 0.033*\"priest\" + 0.020*\"quarterli\" + 0.020*\"duke\" + 0.020*\"grammat\" + 0.016*\"idiosyncrat\" + 0.015*\"rotterdam\" + 0.015*\"brazil\" + 0.014*\"princ\" + 0.013*\"count\"\n", + "2019-01-31 00:36:11,623 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"call\" + 0.004*\"man\"\n", + "2019-01-31 00:36:11,629 : INFO : topic diff=0.008042, rho=0.041100\n", + "2019-01-31 00:36:11,785 : INFO : PROGRESS: pass 0, at document #1186000/4922894\n", + "2019-01-31 00:36:13,339 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:13,607 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.019*\"di\" + 0.017*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:36:13,608 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" 
+ 0.034*\"pari\" + 0.024*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:36:13,609 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"have\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"treat\" + 0.006*\"gastrointestin\" + 0.006*\"proper\"\n", + "2019-01-31 00:36:13,610 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"director\"\n", + "2019-01-31 00:36:13,612 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.011*\"live\" + 0.011*\"genu\" + 0.011*\"plaisir\" + 0.009*\"yawn\"\n", + "2019-01-31 00:36:13,617 : INFO : topic diff=0.006065, rho=0.041065\n", + "2019-01-31 00:36:13,773 : INFO : PROGRESS: pass 0, at document #1188000/4922894\n", + "2019-01-31 00:36:15,174 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:15,440 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.018*\"norwai\" + 0.017*\"norwegian\" + 0.016*\"swedish\" + 0.015*\"sweden\" + 0.014*\"wind\" + 0.014*\"damag\" + 0.013*\"unjust\" + 0.011*\"turkish\" + 0.011*\"denmark\"\n", + "2019-01-31 00:36:15,441 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.010*\"woodcut\" + 0.010*\"centuri\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"charact\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.007*\"god\"\n", + "2019-01-31 00:36:15,442 : INFO : topic #16 (0.020): 0.046*\"king\" + 0.034*\"priest\" + 0.020*\"quarterli\" + 0.020*\"duke\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.015*\"rotterdam\" + 0.014*\"brazil\" + 0.013*\"princ\" + 0.013*\"count\"\n", + "2019-01-31 00:36:15,444 : INFO : topic #45 (0.020): 0.022*\"jpg\" + 0.021*\"fifteenth\" + 
0.017*\"colder\" + 0.017*\"illicit\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:36:15,445 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:36:15,450 : INFO : topic diff=0.006913, rho=0.041030\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:36:15,607 : INFO : PROGRESS: pass 0, at document #1190000/4922894\n", + "2019-01-31 00:36:17,016 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:17,283 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.040*\"raid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.017*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:36:17,284 : INFO : topic #23 (0.020): 0.140*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.032*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.020*\"women\" + 0.018*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:36:17,285 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.014*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:36:17,286 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.036*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.011*\"pope\" + 0.010*\"fleet\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 00:36:17,287 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.033*\"unionist\" + 0.033*\"cotton\" + 0.030*\"american\" + 0.026*\"new\" + 0.015*\"year\" + 0.013*\"warrior\" + 0.013*\"california\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:36:17,293 : INFO : topic 
diff=0.006854, rho=0.040996\n", + "2019-01-31 00:36:17,449 : INFO : PROGRESS: pass 0, at document #1192000/4922894\n", + "2019-01-31 00:36:18,844 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:19,111 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 00:36:19,112 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"produc\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:36:19,113 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.040*\"raid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.017*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:36:19,114 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:36:19,115 : INFO : topic #3 (0.020): 0.038*\"present\" + 0.028*\"offic\" + 0.025*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.018*\"member\" + 0.018*\"serv\" + 0.018*\"gener\" + 0.016*\"chickasaw\" + 0.015*\"seri\"\n", + "2019-01-31 00:36:19,121 : INFO : topic diff=0.005556, rho=0.040962\n", + "2019-01-31 00:36:19,277 : INFO : PROGRESS: pass 0, at document #1194000/4922894\n", + "2019-01-31 00:36:20,674 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:20,940 : INFO : topic #23 (0.020): 0.140*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.032*\"jacksonvil\" + 0.025*\"japanes\" + 0.022*\"festiv\" + 0.021*\"noll\" + 0.020*\"women\" + 0.018*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:36:20,941 : 
INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.021*\"event\" + 0.021*\"medal\" + 0.018*\"rainfal\" + 0.018*\"nation\" + 0.018*\"alic\"\n", + "2019-01-31 00:36:20,942 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.015*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.009*\"legal\" + 0.008*\"replac\"\n", + "2019-01-31 00:36:20,943 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.040*\"line\" + 0.039*\"raid\" + 0.038*\"arsen\" + 0.028*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.016*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:36:20,944 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.009*\"european\" + 0.009*\"itali\" + 0.008*\"austria\"\n", + "2019-01-31 00:36:20,950 : INFO : topic diff=0.005746, rho=0.040927\n", + "2019-01-31 00:36:21,106 : INFO : PROGRESS: pass 0, at document #1196000/4922894\n", + "2019-01-31 00:36:22,488 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:22,754 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.017*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:36:22,755 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:36:22,757 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.017*\"taxpay\" + 0.016*\"chamber\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 00:36:22,758 : INFO : topic #0 (0.020): 
0.070*\"statewid\" + 0.040*\"line\" + 0.039*\"raid\" + 0.038*\"arsen\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.016*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:36:22,759 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"comic\" + 0.007*\"gestur\" + 0.006*\"blue\" + 0.005*\"vision\" + 0.004*\"bewild\" + 0.004*\"dixi\" + 0.004*\"black\" + 0.004*\"litig\"\n", + "2019-01-31 00:36:22,765 : INFO : topic diff=0.006996, rho=0.040893\n", + "2019-01-31 00:36:22,915 : INFO : PROGRESS: pass 0, at document #1198000/4922894\n", + "2019-01-31 00:36:24,283 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:24,550 : INFO : topic #29 (0.020): 0.020*\"companhia\" + 0.011*\"million\" + 0.009*\"busi\" + 0.009*\"bank\" + 0.009*\"yawn\" + 0.009*\"market\" + 0.007*\"industri\" + 0.007*\"function\" + 0.007*\"start\" + 0.007*\"govern\"\n", + "2019-01-31 00:36:24,551 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.031*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:36:24,552 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.025*\"collector\" + 0.022*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:36:24,553 : INFO : topic #35 (0.020): 0.052*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.021*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:36:24,555 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:36:24,560 : INFO : topic 
diff=0.007585, rho=0.040859\n", + "2019-01-31 00:36:27,262 : INFO : -11.689 per-word bound, 3302.0 perplexity estimate based on a held-out corpus of 2000 documents with 554964 words\n", + "2019-01-31 00:36:27,263 : INFO : PROGRESS: pass 0, at document #1200000/4922894\n", + "2019-01-31 00:36:28,659 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:28,926 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"mandir\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:36:28,927 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.052*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.014*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 00:36:28,928 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.011*\"commun\" + 0.011*\"organ\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"cultur\" + 0.008*\"peopl\" + 0.007*\"summerhil\" + 0.006*\"human\"\n", + "2019-01-31 00:36:28,929 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.027*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"serv\" + 0.018*\"gener\" + 0.016*\"chickasaw\" + 0.015*\"seri\"\n", + "2019-01-31 00:36:28,930 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:36:28,936 : INFO : topic diff=0.006620, rho=0.040825\n", + "2019-01-31 00:36:29,092 : INFO : PROGRESS: pass 0, at document #1202000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:36:30,495 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:30,762 : INFO : topic #24 (0.020): 
0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:36:30,763 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"adulthood\" + 0.024*\"factor\" + 0.017*\"feel\" + 0.015*\"male\" + 0.015*\"hostil\" + 0.011*\"genu\" + 0.011*\"live\" + 0.011*\"plaisir\" + 0.010*\"yawn\"\n", + "2019-01-31 00:36:30,765 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"armi\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"unionist\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:36:30,766 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:36:30,767 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.020*\"lagrang\" + 0.018*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:36:30,772 : INFO : topic diff=0.006743, rho=0.040791\n", + "2019-01-31 00:36:30,925 : INFO : PROGRESS: pass 0, at document #1204000/4922894\n", + "2019-01-31 00:36:32,318 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:32,585 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:36:32,586 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.039*\"line\" + 0.039*\"arsen\" + 0.038*\"raid\" + 0.029*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.016*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:36:32,587 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 
0.022*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.012*\"unionist\" + 0.011*\"airmen\"\n", + "2019-01-31 00:36:32,588 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.016*\"ricardo\" + 0.012*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.008*\"replac\" + 0.008*\"order\"\n", + "2019-01-31 00:36:32,590 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:36:32,595 : INFO : topic diff=0.005168, rho=0.040757\n", + "2019-01-31 00:36:32,756 : INFO : PROGRESS: pass 0, at document #1206000/4922894\n", + "2019-01-31 00:36:34,154 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:34,421 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"place\" + 0.018*\"theater\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:36:34,422 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.030*\"son\" + 0.028*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:36:34,423 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"televis\" + 0.011*\"tajikistan\" + 0.011*\"muskoge\" + 0.011*\"pakistan\" + 0.011*\"khalsa\" + 0.010*\"anglo\" + 0.009*\"alam\"\n", + "2019-01-31 00:36:34,424 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 00:36:34,425 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.029*\"final\" + 0.023*\"wife\" + 
0.021*\"tourist\" + 0.018*\"champion\" + 0.017*\"taxpay\" + 0.016*\"chamber\" + 0.015*\"tiepolo\" + 0.014*\"martin\" + 0.012*\"open\"\n", + "2019-01-31 00:36:34,431 : INFO : topic diff=0.005536, rho=0.040723\n", + "2019-01-31 00:36:34,588 : INFO : PROGRESS: pass 0, at document #1208000/4922894\n", + "2019-01-31 00:36:35,992 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:36,258 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.012*\"aza\" + 0.009*\"battalion\" + 0.009*\"teufel\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.008*\"till\" + 0.007*\"armi\" + 0.007*\"king\" + 0.006*\"militari\"\n", + "2019-01-31 00:36:36,259 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.027*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.018*\"serv\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:36:36,260 : INFO : topic #48 (0.020): 0.079*\"octob\" + 0.078*\"march\" + 0.074*\"sens\" + 0.071*\"notion\" + 0.069*\"januari\" + 0.067*\"juli\" + 0.066*\"august\" + 0.066*\"april\" + 0.065*\"decatur\" + 0.065*\"judici\"\n", + "2019-01-31 00:36:36,262 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:36:36,263 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:36:36,269 : INFO : topic diff=0.005751, rho=0.040689\n", + "2019-01-31 00:36:36,422 : INFO : PROGRESS: pass 0, at document #1210000/4922894\n", + "2019-01-31 00:36:37,796 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:38,063 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 
0.013*\"televis\" + 0.012*\"tajikistan\" + 0.012*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"pakistan\" + 0.010*\"khalsa\" + 0.009*\"alam\"\n", + "2019-01-31 00:36:38,064 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.030*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.017*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:36:38,065 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:36:38,066 : INFO : topic #16 (0.020): 0.046*\"king\" + 0.031*\"priest\" + 0.021*\"quarterli\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.015*\"rotterdam\" + 0.015*\"brazil\" + 0.014*\"princ\" + 0.013*\"portugues\"\n", + "2019-01-31 00:36:38,068 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:36:38,073 : INFO : topic diff=0.005992, rho=0.040656\n", + "2019-01-31 00:36:38,230 : INFO : PROGRESS: pass 0, at document #1212000/4922894\n", + "2019-01-31 00:36:39,656 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:39,922 : INFO : topic #31 (0.020): 0.063*\"fusiform\" + 0.024*\"scientist\" + 0.023*\"player\" + 0.023*\"taxpay\" + 0.021*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.009*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 00:36:39,924 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.025*\"collector\" + 0.022*\"institut\" + 0.021*\"schuster\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:36:39,925 : INFO : topic #7 (0.020): 0.020*\"di\" + 0.020*\"snatch\" 
+ 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:36:39,926 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:36:39,927 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.030*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:36:39,933 : INFO : topic diff=0.007340, rho=0.040622\n", + "2019-01-31 00:36:40,147 : INFO : PROGRESS: pass 0, at document #1214000/4922894\n", + "2019-01-31 00:36:41,558 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:41,825 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"bahá\" + 0.010*\"coalit\" + 0.009*\"class\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:36:41,826 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:36:41,828 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:36:41,829 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.027*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:36:41,830 : 
INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:36:41,836 : INFO : topic diff=0.005980, rho=0.040589\n", + "2019-01-31 00:36:41,990 : INFO : PROGRESS: pass 0, at document #1216000/4922894\n", + "2019-01-31 00:36:43,381 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:43,648 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"treat\" + 0.007*\"caus\" + 0.006*\"hormon\" + 0.006*\"pathwai\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:36:43,649 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:36:43,650 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:36:43,651 : INFO : topic #29 (0.020): 0.020*\"companhia\" + 0.011*\"million\" + 0.010*\"bank\" + 0.009*\"busi\" + 0.008*\"market\" + 0.008*\"yawn\" + 0.007*\"industri\" + 0.007*\"start\" + 0.007*\"govern\" + 0.007*\"function\"\n", + "2019-01-31 00:36:43,652 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.025*\"collector\" + 0.022*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:36:43,658 : INFO : topic diff=0.006676, rho=0.040555\n", + "2019-01-31 00:36:43,817 : INFO : PROGRESS: pass 0, at document #1218000/4922894\n", + "2019-01-31 00:36:45,206 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:36:45,472 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"place\" + 0.019*\"theater\" + 0.017*\"damn\" + 0.016*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:36:45,473 : INFO : topic #39 (0.020): 0.048*\"canada\" + 0.039*\"canadian\" + 0.022*\"toronto\" + 0.020*\"hoar\" + 0.019*\"ontario\" + 0.013*\"new\" + 0.012*\"hydrogen\" + 0.012*\"novotná\" + 0.011*\"misericordia\" + 0.011*\"araz\"\n", + "2019-01-31 00:36:45,474 : INFO : topic #45 (0.020): 0.021*\"jpg\" + 0.021*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:36:45,476 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.023*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:36:45,477 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"poet\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 00:36:45,482 : INFO : topic diff=0.006979, rho=0.040522\n", + "2019-01-31 00:36:48,134 : INFO : -11.796 per-word bound, 3557.0 perplexity estimate based on a held-out corpus of 2000 documents with 533248 words\n", + "2019-01-31 00:36:48,135 : INFO : PROGRESS: pass 0, at document #1220000/4922894\n", + "2019-01-31 00:36:49,527 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:49,794 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.028*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"constitut\" + 0.010*\"depress\"\n", + "2019-01-31 00:36:49,795 : INFO : topic #40 (0.020): 0.087*\"unit\" + 
0.025*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:36:49,796 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.021*\"spain\" + 0.020*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.012*\"lizard\" + 0.012*\"juan\" + 0.011*\"francisco\" + 0.011*\"santa\" + 0.011*\"carlo\"\n", + "2019-01-31 00:36:49,797 : INFO : topic #39 (0.020): 0.048*\"canada\" + 0.038*\"canadian\" + 0.021*\"toronto\" + 0.020*\"hoar\" + 0.019*\"ontario\" + 0.013*\"new\" + 0.012*\"hydrogen\" + 0.012*\"novotná\" + 0.011*\"misericordia\" + 0.010*\"araz\"\n", + "2019-01-31 00:36:49,799 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:36:49,805 : INFO : topic diff=0.007897, rho=0.040489\n", + "2019-01-31 00:36:49,958 : INFO : PROGRESS: pass 0, at document #1222000/4922894\n", + "2019-01-31 00:36:51,349 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:51,616 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"encyclopedia\" + 0.007*\"candid\" + 0.007*\"mandir\"\n", + "2019-01-31 00:36:51,617 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.033*\"incumb\" + 0.013*\"televis\" + 0.012*\"islam\" + 0.012*\"tajikistan\" + 0.012*\"anglo\" + 0.010*\"pakistan\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 00:36:51,619 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:36:51,620 : INFO : topic #32 (0.020): 
0.054*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.028*\"cotton\" + 0.027*\"area\" + 0.025*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.018*\"commun\"\n", + "2019-01-31 00:36:51,621 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.030*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:36:51,626 : INFO : topic diff=0.005738, rho=0.040456\n", + "2019-01-31 00:36:51,787 : INFO : PROGRESS: pass 0, at document #1224000/4922894\n", + "2019-01-31 00:36:53,215 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:53,481 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.039*\"sovereignti\" + 0.035*\"rural\" + 0.023*\"personifi\" + 0.022*\"poison\" + 0.022*\"moscow\" + 0.021*\"reprint\" + 0.016*\"unfortun\" + 0.016*\"poland\" + 0.014*\"indonesia\"\n", + "2019-01-31 00:36:53,482 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:36:53,483 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 00:36:53,484 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.009*\"teufel\" + 0.008*\"empath\" + 0.008*\"till\" + 0.007*\"armi\" + 0.006*\"king\" + 0.006*\"militari\"\n", + "2019-01-31 00:36:53,486 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.030*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"year\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:36:53,491 : INFO : topic 
diff=0.006623, rho=0.040423\n", + "2019-01-31 00:36:53,644 : INFO : PROGRESS: pass 0, at document #1226000/4922894\n", + "2019-01-31 00:36:55,025 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:55,291 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.012*\"storag\" + 0.011*\"magazin\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:36:55,293 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:36:55,294 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.028*\"cotton\" + 0.026*\"area\" + 0.024*\"regim\" + 0.024*\"multitud\" + 0.022*\"citi\" + 0.018*\"commun\"\n", + "2019-01-31 00:36:55,295 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.013*\"televis\" + 0.012*\"islam\" + 0.011*\"anglo\" + 0.011*\"tajikistan\" + 0.011*\"pakistan\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 00:36:55,296 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.041*\"american\" + 0.030*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:36:55,302 : INFO : topic diff=0.006572, rho=0.040390\n", + "2019-01-31 00:36:55,464 : INFO : PROGRESS: pass 0, at document #1228000/4922894\n", + "2019-01-31 00:36:56,899 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:57,165 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.070*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" 
+ 0.019*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:36:57,166 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.025*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:36:57,167 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"diversifi\" + 0.013*\"militari\" + 0.011*\"airbu\"\n", + "2019-01-31 00:36:57,168 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"treat\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:36:57,169 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"warmth\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:36:57,175 : INFO : topic diff=0.007349, rho=0.040357\n", + "2019-01-31 00:36:57,334 : INFO : PROGRESS: pass 0, at document #1230000/4922894\n", + "2019-01-31 00:36:58,747 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:36:59,013 : INFO : topic #45 (0.020): 0.021*\"jpg\" + 0.020*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"hand\"\n", + "2019-01-31 00:36:59,014 : INFO : topic #48 (0.020): 0.078*\"octob\" + 0.077*\"march\" + 0.076*\"sens\" + 0.071*\"notion\" + 0.069*\"januari\" + 0.068*\"juli\" + 0.067*\"august\" + 0.066*\"decatur\" + 0.065*\"judici\" + 0.065*\"april\"\n", + "2019-01-31 00:36:59,016 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"bahá\" + 0.010*\"coalit\" + 
0.009*\"fleet\"\n", + "2019-01-31 00:36:59,017 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.022*\"cathol\" + 0.020*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:36:59,018 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"tajikistan\" + 0.011*\"pakistan\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 00:36:59,024 : INFO : topic diff=0.006716, rho=0.040324\n", + "2019-01-31 00:36:59,193 : INFO : PROGRESS: pass 0, at document #1232000/4922894\n", + "2019-01-31 00:37:00,678 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:00,945 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"armi\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"diversifi\" + 0.011*\"refut\"\n", + "2019-01-31 00:37:00,946 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.014*\"hostil\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:37:00,947 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:37:00,948 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"blue\" + 0.004*\"black\" + 0.004*\"septemb\" + 0.004*\"vision\" + 0.004*\"litig\" + 0.004*\"bewild\"\n", + "2019-01-31 00:37:00,949 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"militari\" 
+ 0.006*\"pour\"\n", + "2019-01-31 00:37:00,955 : INFO : topic diff=0.005569, rho=0.040291\n", + "2019-01-31 00:37:01,113 : INFO : PROGRESS: pass 0, at document #1234000/4922894\n", + "2019-01-31 00:37:02,521 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:02,787 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"fleet\" + 0.010*\"bahá\" + 0.010*\"coalit\"\n", + "2019-01-31 00:37:02,788 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:37:02,789 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.024*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:37:02,790 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:37:02,791 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.012*\"open\"\n", + "2019-01-31 00:37:02,797 : INFO : topic diff=0.006951, rho=0.040258\n", + "2019-01-31 00:37:02,953 : INFO : PROGRESS: pass 0, at document #1236000/4922894\n", + "2019-01-31 00:37:04,358 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:04,625 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.040*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 
0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:37:04,626 : INFO : topic #45 (0.020): 0.021*\"jpg\" + 0.020*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"hand\"\n", + "2019-01-31 00:37:04,628 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.020*\"mexico\" + 0.020*\"del\" + 0.014*\"soviet\" + 0.012*\"lizard\" + 0.012*\"juan\" + 0.011*\"mexican\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 00:37:04,629 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"task\" + 0.009*\"district\"\n", + "2019-01-31 00:37:04,630 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.013*\"israel\" + 0.013*\"berlin\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 00:37:04,636 : INFO : topic diff=0.006980, rho=0.040226\n", + "2019-01-31 00:37:04,788 : INFO : PROGRESS: pass 0, at document #1238000/4922894\n", + "2019-01-31 00:37:06,158 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:06,425 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.017*\"ricardo\" + 0.012*\"case\" + 0.011*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 00:37:06,427 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.023*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"report\" + 0.013*\"liber\" + 0.013*\"selma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:37:06,428 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 
0.022*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:37:06,429 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.036*\"raid\" + 0.031*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:37:06,431 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"cathol\" + 0.020*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.009*\"centuri\" + 0.009*\"monasteri\" + 0.009*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:37:06,437 : INFO : topic diff=0.006379, rho=0.040193\n", + "2019-01-31 00:37:09,131 : INFO : -11.836 per-word bound, 3654.9 perplexity estimate based on a held-out corpus of 2000 documents with 559726 words\n", + "2019-01-31 00:37:09,131 : INFO : PROGRESS: pass 0, at document #1240000/4922894\n", + "2019-01-31 00:37:10,521 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:10,788 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:37:10,789 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.039*\"line\" + 0.038*\"arsen\" + 0.036*\"raid\" + 0.030*\"museo\" + 0.021*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:37:10,790 : INFO : topic #36 (0.020): 0.013*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"serv\" + 0.008*\"oper\" + 0.008*\"softwar\" + 0.007*\"base\" + 0.007*\"diggin\"\n", + "2019-01-31 00:37:10,791 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.010*\"class\" + 
0.010*\"coalit\"\n", + "2019-01-31 00:37:10,792 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.071*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.021*\"festiv\" + 0.019*\"intern\" + 0.019*\"women\" + 0.014*\"prison\"\n", + "2019-01-31 00:37:10,798 : INFO : topic diff=0.006861, rho=0.040161\n", + "2019-01-31 00:37:10,955 : INFO : PROGRESS: pass 0, at document #1242000/4922894\n", + "2019-01-31 00:37:12,359 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:12,628 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:37:12,629 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.014*\"driver\" + 0.012*\"find\" + 0.012*\"ret\" + 0.011*\"landslid\" + 0.010*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:37:12,631 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"commun\" + 0.010*\"develop\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:37:12,632 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:37:12,633 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 00:37:12,639 : INFO : topic diff=0.005765, rho=0.040129\n", + "2019-01-31 00:37:12,808 : INFO : PROGRESS: pass 0, at document #1244000/4922894\n", + "2019-01-31 00:37:14,259 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:37:14,525 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.014*\"driver\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"landslid\" + 0.010*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:37:14,527 : INFO : topic #29 (0.020): 0.021*\"companhia\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"busi\" + 0.008*\"market\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.007*\"manag\" + 0.007*\"govern\" + 0.007*\"produc\"\n", + "2019-01-31 00:37:14,528 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:37:14,529 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:37:14,530 : INFO : topic #39 (0.020): 0.048*\"canada\" + 0.037*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.012*\"hydrogen\" + 0.011*\"quebec\"\n", + "2019-01-31 00:37:14,536 : INFO : topic diff=0.007045, rho=0.040096\n", + "2019-01-31 00:37:14,747 : INFO : PROGRESS: pass 0, at document #1246000/4922894\n", + "2019-01-31 00:37:16,160 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:16,426 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.037*\"raid\" + 0.030*\"museo\" + 0.021*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:37:16,427 : INFO : topic #16 (0.020): 0.047*\"king\" + 0.030*\"priest\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.019*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.016*\"brazil\" + 0.015*\"portugues\" + 
0.015*\"rotterdam\" + 0.013*\"portrait\"\n", + "2019-01-31 00:37:16,428 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.029*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"hungarian\"\n", + "2019-01-31 00:37:16,429 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"armi\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airmen\"\n", + "2019-01-31 00:37:16,430 : INFO : topic #36 (0.020): 0.013*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"serv\" + 0.008*\"oper\" + 0.007*\"softwar\" + 0.007*\"base\" + 0.007*\"diggin\"\n", + "2019-01-31 00:37:16,436 : INFO : topic diff=0.006898, rho=0.040064\n", + "2019-01-31 00:37:16,593 : INFO : PROGRESS: pass 0, at document #1248000/4922894\n", + "2019-01-31 00:37:17,998 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:18,264 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.038*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.013*\"new\" + 0.012*\"misericordia\" + 0.012*\"novotná\" + 0.012*\"hydrogen\" + 0.011*\"quebec\"\n", + "2019-01-31 00:37:18,265 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"king\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:37:18,266 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:37:18,267 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 
0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:37:18,268 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.034*\"unionist\" + 0.031*\"american\" + 0.030*\"cotton\" + 0.027*\"new\" + 0.015*\"year\" + 0.015*\"warrior\" + 0.014*\"california\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:37:18,274 : INFO : topic diff=0.006420, rho=0.040032\n", + "2019-01-31 00:37:18,428 : INFO : PROGRESS: pass 0, at document #1250000/4922894\n", + "2019-01-31 00:37:19,796 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:20,062 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.038*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.013*\"new\" + 0.012*\"misericordia\" + 0.012*\"novotná\" + 0.012*\"hydrogen\" + 0.011*\"quebec\"\n", + "2019-01-31 00:37:20,063 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"king\" + 0.006*\"militari\" + 0.006*\"till\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:37:20,065 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:37:20,066 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:37:20,067 : INFO : topic #11 (0.020): 0.027*\"john\" + 0.015*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:37:20,073 : INFO : topic diff=0.007088, rho=0.040000\n", + "2019-01-31 00:37:20,227 : INFO : PROGRESS: pass 0, at document 
#1252000/4922894\n", + "2019-01-31 00:37:21,613 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:21,880 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.024*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.016*\"com\" + 0.014*\"oper\" + 0.013*\"refut\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\"\n", + "2019-01-31 00:37:21,881 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"poet\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"measur\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"utopian\"\n", + "2019-01-31 00:37:21,882 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.016*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:37:21,883 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"swedish\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.016*\"norwegian\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.013*\"turkish\" + 0.012*\"replac\" + 0.011*\"denmark\"\n", + "2019-01-31 00:37:21,884 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.040*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:37:21,890 : INFO : topic diff=0.007750, rho=0.039968\n", + "2019-01-31 00:37:22,041 : INFO : PROGRESS: pass 0, at document #1254000/4922894\n", + "2019-01-31 00:37:23,398 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:23,664 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.020*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"atheist\" + 0.017*\"taxpay\"\n", + "2019-01-31 00:37:23,665 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" 
+ 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"produc\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\"\n", + "2019-01-31 00:37:23,666 : INFO : topic #36 (0.020): 0.013*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"oper\" + 0.008*\"serv\" + 0.008*\"softwar\" + 0.007*\"base\" + 0.007*\"user\"\n", + "2019-01-31 00:37:23,667 : INFO : topic #16 (0.020): 0.047*\"king\" + 0.030*\"priest\" + 0.019*\"grammat\" + 0.019*\"quarterli\" + 0.018*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"brazil\" + 0.015*\"portugues\" + 0.015*\"rotterdam\" + 0.013*\"kingdom\"\n", + "2019-01-31 00:37:23,668 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.022*\"fifteenth\" + 0.018*\"colder\" + 0.017*\"illicit\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:37:23,674 : INFO : topic diff=0.008235, rho=0.039936\n", + "2019-01-31 00:37:23,830 : INFO : PROGRESS: pass 0, at document #1256000/4922894\n", + "2019-01-31 00:37:25,208 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:25,474 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.037*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:37:25,475 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"king\" + 0.006*\"militari\"\n", + "2019-01-31 00:37:25,477 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.039*\"sovereignti\" + 0.036*\"rural\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.021*\"moscow\" + 0.021*\"personifi\" + 0.017*\"unfortun\" + 0.015*\"poland\" + 0.015*\"czech\"\n", + "2019-01-31 00:37:25,478 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"poet\" + 0.007*\"frontal\" + 
0.007*\"measur\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 00:37:25,479 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:37:25,485 : INFO : topic diff=0.006499, rho=0.039904\n", + "2019-01-31 00:37:25,638 : INFO : PROGRESS: pass 0, at document #1258000/4922894\n", + "2019-01-31 00:37:27,024 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:27,290 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.051*\"chilton\" + 0.021*\"hong\" + 0.021*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.014*\"leah\" + 0.014*\"sourc\" + 0.013*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 00:37:27,291 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"lanewai\" + 0.010*\"genu\" + 0.010*\"live\"\n", + "2019-01-31 00:37:27,292 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.010*\"théori\"\n", + "2019-01-31 00:37:27,293 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"collector\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:37:27,295 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"poet\" + 0.007*\"measur\" + 0.007*\"frontal\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 00:37:27,300 : INFO : topic diff=0.006583, rho=0.039873\n", + "2019-01-31 00:37:29,994 : INFO : -11.621 
per-word bound, 3150.0 perplexity estimate based on a held-out corpus of 2000 documents with 547150 words\n", + "2019-01-31 00:37:29,994 : INFO : PROGRESS: pass 0, at document #1260000/4922894\n", + "2019-01-31 00:37:31,388 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:31,655 : INFO : topic #36 (0.020): 0.014*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"serv\" + 0.008*\"oper\" + 0.008*\"softwar\" + 0.007*\"base\" + 0.007*\"diggin\"\n", + "2019-01-31 00:37:31,656 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.012*\"folei\" + 0.009*\"yawn\" + 0.009*\"barber\"\n", + "2019-01-31 00:37:31,657 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:37:31,658 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"bahá\" + 0.010*\"fleet\"\n", + "2019-01-31 00:37:31,660 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.006*\"till\" + 0.006*\"centuri\"\n", + "2019-01-31 00:37:31,665 : INFO : topic diff=0.005669, rho=0.039841\n", + "2019-01-31 00:37:31,820 : INFO : PROGRESS: pass 0, at document #1262000/4922894\n", + "2019-01-31 00:37:33,216 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:33,483 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.052*\"chilton\" + 0.021*\"hong\" + 0.020*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.014*\"sourc\" + 0.014*\"leah\" + 
0.013*\"ashvil\" + 0.013*\"shirin\"\n", + "2019-01-31 00:37:33,484 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"activ\"\n", + "2019-01-31 00:37:33,485 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.029*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:37:33,486 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"alic\" + 0.018*\"nation\"\n", + "2019-01-31 00:37:33,487 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"poet\" + 0.007*\"measur\" + 0.007*\"frontal\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 00:37:33,493 : INFO : topic diff=0.006252, rho=0.039809\n", + "2019-01-31 00:37:33,647 : INFO : PROGRESS: pass 0, at document #1264000/4922894\n", + "2019-01-31 00:37:35,048 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:35,315 : INFO : topic #43 (0.020): 0.060*\"elect\" + 0.054*\"parti\" + 0.023*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.018*\"conserv\" + 0.017*\"liber\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.013*\"report\"\n", + "2019-01-31 00:37:35,316 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:37:35,317 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.006*\"comic\" + 0.004*\"septemb\" 
+ 0.004*\"vision\" + 0.004*\"litig\" + 0.004*\"black\" + 0.004*\"charact\"\n", + "2019-01-31 00:37:35,318 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"driver\" + 0.013*\"find\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.011*\"landslid\" + 0.011*\"fool\" + 0.010*\"horac\"\n", + "2019-01-31 00:37:35,319 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.025*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.018*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:37:35,325 : INFO : topic diff=0.005921, rho=0.039778\n", + "2019-01-31 00:37:35,482 : INFO : PROGRESS: pass 0, at document #1266000/4922894\n", + "2019-01-31 00:37:36,890 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:37,156 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.009*\"depress\"\n", + "2019-01-31 00:37:37,157 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"green\" + 0.007*\"hand\"\n", + "2019-01-31 00:37:37,158 : INFO : topic #31 (0.020): 0.061*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"taxpay\" + 0.023*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"barber\"\n", + "2019-01-31 00:37:37,159 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"proper\" + 0.006*\"pathwai\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 00:37:37,160 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.013*\"juan\" + 
0.012*\"lizard\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"mexican\"\n", + "2019-01-31 00:37:37,166 : INFO : topic diff=0.006054, rho=0.039746\n", + "2019-01-31 00:37:37,327 : INFO : PROGRESS: pass 0, at document #1268000/4922894\n", + "2019-01-31 00:37:38,704 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:38,970 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"task\" + 0.008*\"gothic\"\n", + "2019-01-31 00:37:38,972 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.016*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:37:38,973 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.015*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:37:38,974 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.019*\"mexico\" + 0.019*\"del\" + 0.014*\"soviet\" + 0.013*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.010*\"mexican\"\n", + "2019-01-31 00:37:38,975 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.015*\"jewish\" + 0.014*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"hungarian\"\n", + "2019-01-31 00:37:38,981 : INFO : topic diff=0.006868, rho=0.039715\n", + "2019-01-31 00:37:39,136 : INFO : PROGRESS: pass 0, at document #1270000/4922894\n", + "2019-01-31 00:37:40,521 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:40,788 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.004*\"septemb\" + 
0.004*\"vision\" + 0.004*\"litig\" + 0.004*\"black\" + 0.004*\"dixi\"\n", + "2019-01-31 00:37:40,789 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.016*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:37:40,790 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.018*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"weekli\"\n", + "2019-01-31 00:37:40,791 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"find\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.011*\"landslid\" + 0.011*\"fool\" + 0.010*\"horac\"\n", + "2019-01-31 00:37:40,792 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.039*\"sovereignti\" + 0.038*\"rural\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.016*\"unfortun\" + 0.016*\"poland\" + 0.015*\"czech\"\n", + "2019-01-31 00:37:40,798 : INFO : topic diff=0.006453, rho=0.039684\n", + "2019-01-31 00:37:40,953 : INFO : PROGRESS: pass 0, at document #1272000/4922894\n", + "2019-01-31 00:37:42,340 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:42,605 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.010*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:37:42,607 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.031*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\" + 0.017*\"nation\"\n", + "2019-01-31 00:37:42,608 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.076*\"octob\" + 0.074*\"sens\" + 0.072*\"januari\" + 0.072*\"juli\" + 0.068*\"judici\" + 
0.068*\"notion\" + 0.068*\"april\" + 0.066*\"decatur\" + 0.066*\"august\"\n", + "2019-01-31 00:37:42,609 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.015*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:37:42,610 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"like\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:37:42,616 : INFO : topic diff=0.005854, rho=0.039653\n", + "2019-01-31 00:37:42,773 : INFO : PROGRESS: pass 0, at document #1274000/4922894\n", + "2019-01-31 00:37:44,234 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:44,500 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.040*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:37:44,502 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:37:44,503 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.010*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.007*\"trade\" + 0.007*\"uruguayan\" + 0.007*\"like\" + 0.006*\"god\"\n", + "2019-01-31 00:37:44,504 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.032*\"unionist\" + 0.030*\"american\" + 0.030*\"cotton\" + 0.027*\"new\" + 0.015*\"year\" + 0.014*\"california\" + 0.014*\"warrior\" + 0.013*\"north\" + 0.012*\"terri\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:37:44,505 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 
0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.014*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:37:44,511 : INFO : topic diff=0.005050, rho=0.039621\n", + "2019-01-31 00:37:44,672 : INFO : PROGRESS: pass 0, at document #1276000/4922894\n", + "2019-01-31 00:37:46,089 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:46,356 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:37:46,357 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"produc\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.006*\"encyclopedia\"\n", + "2019-01-31 00:37:46,358 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.009*\"depress\"\n", + "2019-01-31 00:37:46,359 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"commun\" + 0.010*\"develop\" + 0.010*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:37:46,360 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"refut\" + 0.012*\"airbu\" + 0.012*\"militari\"\n", + "2019-01-31 00:37:46,366 : INFO : topic diff=0.007411, rho=0.039590\n", + "2019-01-31 00:37:46,524 : INFO : PROGRESS: pass 0, at document #1278000/4922894\n", + "2019-01-31 00:37:47,921 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:48,187 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 
0.040*\"line\" + 0.039*\"raid\" + 0.038*\"arsen\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.014*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:37:48,189 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.025*\"jean\" + 0.023*\"sail\" + 0.019*\"daphn\" + 0.014*\"loui\" + 0.014*\"lazi\" + 0.013*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:37:48,190 : INFO : topic #45 (0.020): 0.024*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.007*\"light\" + 0.007*\"hand\"\n", + "2019-01-31 00:37:48,191 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"dai\"\n", + "2019-01-31 00:37:48,192 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.020*\"govern\" + 0.020*\"nation\" + 0.020*\"serv\" + 0.019*\"member\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:37:48,198 : INFO : topic diff=0.006415, rho=0.039559\n", + "2019-01-31 00:37:51,004 : INFO : -11.563 per-word bound, 3026.2 perplexity estimate based on a held-out corpus of 2000 documents with 579201 words\n", + "2019-01-31 00:37:51,005 : INFO : PROGRESS: pass 0, at document #1280000/4922894\n", + "2019-01-31 00:37:52,414 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:52,680 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.009*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:37:52,681 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.010*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.007*\"trade\" + 0.007*\"god\" + 
0.007*\"uruguayan\" + 0.007*\"english\"\n", + "2019-01-31 00:37:52,682 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.038*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.013*\"new\" + 0.013*\"hydrogen\" + 0.013*\"novotná\" + 0.012*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:37:52,684 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.006*\"comic\" + 0.005*\"septemb\" + 0.004*\"vision\" + 0.004*\"litig\" + 0.004*\"dixi\" + 0.004*\"charact\"\n", + "2019-01-31 00:37:52,685 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"damag\" + 0.018*\"swedish\" + 0.016*\"norwai\" + 0.015*\"sweden\" + 0.015*\"norwegian\" + 0.014*\"replac\" + 0.013*\"wind\" + 0.012*\"financ\" + 0.012*\"ton\"\n", + "2019-01-31 00:37:52,690 : INFO : topic diff=0.007558, rho=0.039528\n", + "2019-01-31 00:37:52,843 : INFO : PROGRESS: pass 0, at document #1282000/4922894\n", + "2019-01-31 00:37:54,203 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:54,468 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.007*\"till\" + 0.006*\"king\"\n", + "2019-01-31 00:37:54,469 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.022*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:37:54,470 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.048*\"chilton\" + 0.022*\"hong\" + 0.021*\"kong\" + 0.019*\"korea\" + 0.016*\"korean\" + 0.014*\"leah\" + 0.014*\"shirin\" + 0.013*\"sourc\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:37:54,472 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"treat\" + 0.006*\"hormon\" + 0.006*\"effect\" + 
0.006*\"proper\"\n", + "2019-01-31 00:37:54,473 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.032*\"unionist\" + 0.030*\"cotton\" + 0.030*\"american\" + 0.027*\"new\" + 0.015*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"north\" + 0.013*\"terri\"\n", + "2019-01-31 00:37:54,479 : INFO : topic diff=0.006323, rho=0.039498\n", + "2019-01-31 00:37:54,633 : INFO : PROGRESS: pass 0, at document #1284000/4922894\n", + "2019-01-31 00:37:56,030 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:56,296 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.019*\"place\" + 0.017*\"damn\" + 0.017*\"compos\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:37:56,297 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.038*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.013*\"hydrogen\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.011*\"quebec\"\n", + "2019-01-31 00:37:56,298 : INFO : topic #43 (0.020): 0.061*\"elect\" + 0.054*\"parti\" + 0.023*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.015*\"conserv\" + 0.014*\"seaport\" + 0.014*\"selma\"\n", + "2019-01-31 00:37:56,299 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:37:56,301 : INFO : topic #29 (0.020): 0.021*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"bank\" + 0.008*\"market\" + 0.008*\"yawn\" + 0.007*\"industri\" + 0.007*\"manag\" + 0.007*\"govern\" + 0.007*\"produc\"\n", + "2019-01-31 00:37:56,306 : INFO : topic diff=0.006903, rho=0.039467\n", + "2019-01-31 00:37:56,460 : INFO : PROGRESS: pass 0, at document #1286000/4922894\n", + "2019-01-31 00:37:57,853 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:58,120 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:37:58,121 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 00:37:58,122 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:37:58,123 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"damag\" + 0.017*\"swedish\" + 0.015*\"norwai\" + 0.015*\"sweden\" + 0.015*\"norwegian\" + 0.014*\"replac\" + 0.013*\"wind\" + 0.012*\"financ\" + 0.011*\"turkish\"\n", + "2019-01-31 00:37:58,124 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:37:58,130 : INFO : topic diff=0.006142, rho=0.039436\n", + "2019-01-31 00:37:58,282 : INFO : PROGRESS: pass 0, at document #1288000/4922894\n", + "2019-01-31 00:37:59,645 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:37:59,911 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 00:37:59,912 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 
0.006*\"caus\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"hormon\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:37:59,913 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"damag\" + 0.017*\"swedish\" + 0.015*\"norwai\" + 0.015*\"sweden\" + 0.014*\"norwegian\" + 0.014*\"replac\" + 0.013*\"wind\" + 0.012*\"financ\" + 0.011*\"turkish\"\n", + "2019-01-31 00:37:59,914 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.012*\"muskoge\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.009*\"start\"\n", + "2019-01-31 00:37:59,916 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:37:59,921 : INFO : topic diff=0.006987, rho=0.039406\n", + "2019-01-31 00:38:00,077 : INFO : PROGRESS: pass 0, at document #1290000/4922894\n", + "2019-01-31 00:38:01,468 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:01,734 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"have\" + 0.006*\"proper\" + 0.006*\"hormon\" + 0.006*\"effect\"\n", + "2019-01-31 00:38:01,735 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.012*\"muskoge\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.009*\"start\"\n", + "2019-01-31 00:38:01,736 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"christian\" + 0.021*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:38:01,737 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"area\" + 0.016*\"lagrang\" + 
0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"north\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:38:01,739 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.010*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:38:01,744 : INFO : topic diff=0.005685, rho=0.039375\n", + "2019-01-31 00:38:01,904 : INFO : PROGRESS: pass 0, at document #1292000/4922894\n", + "2019-01-31 00:38:03,329 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:03,595 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"english\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:38:03,596 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 00:38:03,597 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.014*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:38:03,598 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.040*\"line\" + 0.037*\"raid\" + 0.037*\"arsen\" + 0.029*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.014*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:38:03,600 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 00:38:03,605 : INFO : topic diff=0.006066, rho=0.039344\n", + "2019-01-31 00:38:03,765 : INFO : PROGRESS: pass 0, at document 
#1294000/4922894\n", + "2019-01-31 00:38:05,180 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:05,447 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.016*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:38:05,449 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"veget\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.007*\"produc\" + 0.007*\"turn\" + 0.007*\"uruguayan\" + 0.007*\"candid\"\n", + "2019-01-31 00:38:05,450 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.021*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"class\" + 0.009*\"district\"\n", + "2019-01-31 00:38:05,451 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.024*\"jean\" + 0.024*\"sail\" + 0.018*\"daphn\" + 0.015*\"loui\" + 0.014*\"lazi\" + 0.012*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:38:05,452 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.010*\"khalsa\" + 0.009*\"start\"\n", + "2019-01-31 00:38:05,458 : INFO : topic diff=0.005902, rho=0.039314\n", + "2019-01-31 00:38:05,614 : INFO : PROGRESS: pass 0, at document #1296000/4922894\n", + "2019-01-31 00:38:07,015 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:07,281 : INFO : topic #9 (0.020): 0.065*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"english\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:38:07,282 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 
0.025*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:38:07,283 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 00:38:07,284 : INFO : topic #29 (0.020): 0.021*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"bank\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.007*\"industri\" + 0.007*\"produc\" + 0.007*\"manag\" + 0.007*\"govern\"\n", + "2019-01-31 00:38:07,285 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.018*\"stop\" + 0.017*\"damag\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.015*\"sweden\" + 0.013*\"replac\" + 0.013*\"wind\" + 0.012*\"financ\" + 0.012*\"treeless\"\n", + "2019-01-31 00:38:07,291 : INFO : topic diff=0.006657, rho=0.039284\n", + "2019-01-31 00:38:07,442 : INFO : PROGRESS: pass 0, at document #1298000/4922894\n", + "2019-01-31 00:38:08,799 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:09,065 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.031*\"incumb\" + 0.015*\"islam\" + 0.012*\"muskoge\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.010*\"tajikistan\" + 0.010*\"khalsa\"\n", + "2019-01-31 00:38:09,066 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:38:09,067 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.037*\"sovereignti\" + 0.036*\"rural\" + 0.027*\"personifi\" + 0.023*\"reprint\" + 0.023*\"poison\" + 0.019*\"moscow\" + 0.017*\"alexand\" + 0.016*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:38:09,068 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"norwai\" + 0.016*\"damag\" + 0.016*\"swedish\" + 
0.015*\"norwegian\" + 0.015*\"sweden\" + 0.013*\"replac\" + 0.013*\"wind\" + 0.012*\"treeless\" + 0.011*\"financ\"\n", + "2019-01-31 00:38:09,069 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.012*\"open\"\n", + "2019-01-31 00:38:09,075 : INFO : topic diff=0.006940, rho=0.039253\n", + "2019-01-31 00:38:11,725 : INFO : -11.695 per-word bound, 3315.3 perplexity estimate based on a held-out corpus of 2000 documents with 525577 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:38:11,726 : INFO : PROGRESS: pass 0, at document #1300000/4922894\n", + "2019-01-31 00:38:13,089 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:13,355 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.011*\"gothic\" + 0.009*\"class\" + 0.009*\"task\"\n", + "2019-01-31 00:38:13,356 : INFO : topic #29 (0.020): 0.021*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"bank\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.008*\"function\" + 0.007*\"manag\" + 0.007*\"industri\" + 0.007*\"produc\"\n", + "2019-01-31 00:38:13,357 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.022*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.008*\"historiographi\"\n", + "2019-01-31 00:38:13,358 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.031*\"incumb\" + 0.015*\"islam\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.010*\"khalsa\" + 0.010*\"tajikistan\"\n", + "2019-01-31 00:38:13,359 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" 
+ 0.014*\"soviet\" + 0.013*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"francisco\"\n", + "2019-01-31 00:38:13,365 : INFO : topic diff=0.006368, rho=0.039223\n", + "2019-01-31 00:38:13,519 : INFO : PROGRESS: pass 0, at document #1302000/4922894\n", + "2019-01-31 00:38:14,902 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:15,168 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.033*\"incumb\" + 0.014*\"islam\" + 0.012*\"muskoge\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.010*\"televis\" + 0.010*\"tajikistan\"\n", + "2019-01-31 00:38:15,170 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.012*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:38:15,171 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.019*\"member\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.016*\"chickasaw\" + 0.016*\"seri\"\n", + "2019-01-31 00:38:15,172 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"man\"\n", + "2019-01-31 00:38:15,174 : INFO : topic #36 (0.020): 0.013*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.007*\"serv\" + 0.007*\"user\" + 0.007*\"diggin\" + 0.007*\"base\" + 0.007*\"brio\"\n", + "2019-01-31 00:38:15,179 : INFO : topic diff=0.005951, rho=0.039193\n", + "2019-01-31 00:38:15,334 : INFO : PROGRESS: pass 0, at document #1304000/4922894\n", + "2019-01-31 00:38:16,716 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:16,982 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 
0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:38:16,983 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.019*\"member\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:38:16,985 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.023*\"folei\" + 0.017*\"goal\" + 0.014*\"martin\" + 0.011*\"player\"\n", + "2019-01-31 00:38:16,986 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.011*\"alam\" + 0.011*\"televis\" + 0.010*\"khalsa\" + 0.009*\"tajikistan\"\n", + "2019-01-31 00:38:16,987 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.017*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:38:16,993 : INFO : topic diff=0.005795, rho=0.039163\n", + "2019-01-31 00:38:17,148 : INFO : PROGRESS: pass 0, at document #1306000/4922894\n", + "2019-01-31 00:38:18,544 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:18,814 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.011*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:38:18,816 : INFO : topic #35 (0.020): 0.053*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.027*\"personifi\" + 0.023*\"reprint\" + 0.023*\"poison\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"alexand\"\n", + "2019-01-31 00:38:18,817 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.029*\"new\" + 0.022*\"palmer\" + 
0.014*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:38:18,818 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"hormon\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:38:18,819 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.036*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"artist\"\n", + "2019-01-31 00:38:18,825 : INFO : topic diff=0.005368, rho=0.039133\n", + "2019-01-31 00:38:18,981 : INFO : PROGRESS: pass 0, at document #1308000/4922894\n", + "2019-01-31 00:38:20,377 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:20,643 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.030*\"american\" + 0.027*\"new\" + 0.015*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:38:20,644 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"hormon\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:38:20,645 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"govern\" + 0.021*\"nation\" + 0.019*\"member\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:38:20,647 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.018*\"dutch\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"player\" + 0.016*\"english\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:38:20,648 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 
0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.010*\"linear\" + 0.010*\"highland\"\n", + "2019-01-31 00:38:20,654 : INFO : topic diff=0.005020, rho=0.039103\n", + "2019-01-31 00:38:20,869 : INFO : PROGRESS: pass 0, at document #1310000/4922894\n", + "2019-01-31 00:38:22,280 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:22,547 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"worldwid\" + 0.012*\"nicola\" + 0.011*\"collect\"\n", + "2019-01-31 00:38:22,549 : INFO : topic #43 (0.020): 0.061*\"elect\" + 0.054*\"parti\" + 0.023*\"democrat\" + 0.023*\"voluntari\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"liber\" + 0.015*\"republ\" + 0.014*\"selma\" + 0.014*\"seaport\"\n", + "2019-01-31 00:38:22,550 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.004*\"appear\" + 0.004*\"vision\" + 0.004*\"charact\" + 0.004*\"litig\"\n", + "2019-01-31 00:38:22,551 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:38:22,552 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:38:22,558 : INFO : topic diff=0.006056, rho=0.039073\n", + "2019-01-31 00:38:22,712 : INFO : PROGRESS: pass 0, at document #1312000/4922894\n", + "2019-01-31 00:38:24,099 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 
00:38:24,365 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"dioces\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:38:24,366 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.035*\"raid\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"artist\"\n", + "2019-01-31 00:38:24,367 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.039*\"rural\" + 0.037*\"sovereignti\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.022*\"poison\" + 0.021*\"moscow\" + 0.016*\"unfortun\" + 0.016*\"poland\" + 0.016*\"alexand\"\n", + "2019-01-31 00:38:24,368 : INFO : topic #16 (0.020): 0.047*\"king\" + 0.033*\"priest\" + 0.020*\"duke\" + 0.020*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"idiosyncrat\" + 0.015*\"rotterdam\" + 0.015*\"brazil\" + 0.014*\"princ\" + 0.013*\"portugues\"\n", + "2019-01-31 00:38:24,369 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.011*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:38:24,376 : INFO : topic diff=0.006993, rho=0.039043\n", + "2019-01-31 00:38:24,533 : INFO : PROGRESS: pass 0, at document #1314000/4922894\n", + "2019-01-31 00:38:25,919 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:26,185 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.035*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"artist\"\n", + "2019-01-31 00:38:26,186 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + 
"2019-01-31 00:38:26,187 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"worldwid\" + 0.012*\"nicola\" + 0.011*\"collect\"\n", + "2019-01-31 00:38:26,189 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"live\" + 0.009*\"yawn\"\n", + "2019-01-31 00:38:26,190 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.033*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"alam\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.009*\"tajikistan\"\n", + "2019-01-31 00:38:26,196 : INFO : topic diff=0.006283, rho=0.039014\n", + "2019-01-31 00:38:26,363 : INFO : PROGRESS: pass 0, at document #1316000/4922894\n", + "2019-01-31 00:38:27,776 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:28,045 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"king\" + 0.006*\"till\"\n", + "2019-01-31 00:38:28,047 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"produc\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"turn\"\n", + "2019-01-31 00:38:28,048 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"dioces\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:38:28,049 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"centuri\" + 0.010*\"form\" + 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.007*\"trade\" + 0.007*\"god\" + 0.007*\"like\" + 0.007*\"uruguayan\"\n", + 
"2019-01-31 00:38:28,050 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.017*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:38:28,056 : INFO : topic diff=0.007139, rho=0.038984\n", + "2019-01-31 00:38:28,211 : INFO : PROGRESS: pass 0, at document #1318000/4922894\n", + "2019-01-31 00:38:29,620 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:29,886 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.021*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"dioces\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.008*\"poll\"\n", + "2019-01-31 00:38:29,887 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:38:29,888 : INFO : topic #42 (0.020): 0.043*\"german\" + 0.029*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.013*\"berlin\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"isra\"\n", + "2019-01-31 00:38:29,889 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.040*\"line\" + 0.038*\"arsen\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"artist\"\n", + "2019-01-31 00:38:29,890 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"poet\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"method\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 00:38:29,896 : INFO : topic diff=0.005803, rho=0.038954\n", + "2019-01-31 00:38:32,569 : INFO : -11.792 per-word bound, 3546.0 perplexity estimate based on a held-out corpus of 2000 documents with 529492 words\n", + "2019-01-31 
00:38:32,570 : INFO : PROGRESS: pass 0, at document #1320000/4922894\n", + "2019-01-31 00:38:33,951 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:34,217 : INFO : topic #26 (0.020): 0.034*\"workplac\" + 0.031*\"champion\" + 0.025*\"olymp\" + 0.025*\"woman\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"atheist\" + 0.018*\"gold\"\n", + "2019-01-31 00:38:34,218 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"poet\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 00:38:34,219 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.011*\"gothic\" + 0.009*\"class\" + 0.009*\"district\"\n", + "2019-01-31 00:38:34,220 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"briarwood\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:38:34,221 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"produc\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"develop\"\n", + "2019-01-31 00:38:34,227 : INFO : topic diff=0.006061, rho=0.038925\n", + "2019-01-31 00:38:34,387 : INFO : PROGRESS: pass 0, at document #1322000/4922894\n", + "2019-01-31 00:38:35,801 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:36,067 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.039*\"canadian\" + 0.021*\"hoar\" + 0.020*\"toronto\" + 0.017*\"ontario\" + 0.014*\"hydrogen\" + 0.013*\"novotná\" + 0.013*\"new\" + 0.011*\"misericordia\" + 0.011*\"quebec\"\n", + "2019-01-31 00:38:36,068 : INFO : 
topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"linear\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:38:36,069 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.042*\"tortur\" + 0.031*\"cotton\" + 0.026*\"area\" + 0.023*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:38:36,070 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:38:36,071 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.041*\"line\" + 0.038*\"arsen\" + 0.034*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"gai\"\n", + "2019-01-31 00:38:36,077 : INFO : topic diff=0.005934, rho=0.038895\n", + "2019-01-31 00:38:36,231 : INFO : PROGRESS: pass 0, at document #1324000/4922894\n", + "2019-01-31 00:38:37,615 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:38:37,881 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"rural\" + 0.037*\"sovereignti\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.022*\"poison\" + 0.021*\"moscow\" + 0.015*\"unfortun\" + 0.015*\"poland\" + 0.014*\"alexand\"\n", + "2019-01-31 00:38:37,882 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"colder\" + 0.016*\"illicit\" + 0.016*\"western\" + 0.015*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:38:37,883 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"method\" + 0.006*\"southern\" + 
0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"servitud\"\n", + "2019-01-31 00:38:37,884 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:38:37,885 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.011*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"televis\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.010*\"tajikistan\"\n", + "2019-01-31 00:38:37,891 : INFO : topic diff=0.006710, rho=0.038866\n", + "2019-01-31 00:38:38,045 : INFO : PROGRESS: pass 0, at document #1326000/4922894\n", + "2019-01-31 00:38:39,436 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:39,702 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.009*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:38:39,703 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.044*\"american\" + 0.029*\"valour\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.018*\"dutch\" + 0.017*\"player\" + 0.015*\"english\" + 0.012*\"simpler\" + 0.011*\"surnam\"\n", + "2019-01-31 00:38:39,705 : INFO : topic #46 (0.020): 0.021*\"stop\" + 0.018*\"damag\" + 0.016*\"norwai\" + 0.015*\"replac\" + 0.015*\"swedish\" + 0.015*\"wind\" + 0.013*\"treeless\" + 0.013*\"sweden\" + 0.013*\"norwegian\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:38:39,706 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.010*\"tajikistan\"\n", + "2019-01-31 00:38:39,707 : INFO : topic #31 (0.020): 0.059*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"player\" + 0.025*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" 
+ 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:38:39,713 : INFO : topic diff=0.007468, rho=0.038837\n", + "2019-01-31 00:38:39,870 : INFO : PROGRESS: pass 0, at document #1328000/4922894\n", + "2019-01-31 00:38:41,274 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:41,543 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:38:41,544 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"district\" + 0.009*\"class\"\n", + "2019-01-31 00:38:41,545 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.024*\"christian\" + 0.021*\"bishop\" + 0.021*\"cathol\" + 0.015*\"sail\" + 0.014*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"centuri\" + 0.009*\"dioces\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:38:41,546 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.018*\"dutch\" + 0.017*\"player\" + 0.015*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:38:41,547 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.007*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"hormon\" + 0.006*\"proper\"\n", + "2019-01-31 00:38:41,553 : INFO : topic diff=0.006012, rho=0.038808\n", + "2019-01-31 00:38:41,705 : INFO : PROGRESS: pass 0, at document #1330000/4922894\n", + "2019-01-31 00:38:43,051 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:43,317 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"rural\" + 0.037*\"sovereignti\" + 0.026*\"personifi\" + 
0.023*\"reprint\" + 0.021*\"poison\" + 0.020*\"moscow\" + 0.015*\"unfortun\" + 0.015*\"poland\" + 0.014*\"alexand\"\n", + "2019-01-31 00:38:43,318 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.017*\"damag\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.014*\"replac\" + 0.014*\"sweden\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:38:43,319 : INFO : topic #39 (0.020): 0.049*\"canada\" + 0.038*\"canadian\" + 0.020*\"toronto\" + 0.020*\"hoar\" + 0.017*\"ontario\" + 0.014*\"novotná\" + 0.014*\"hydrogen\" + 0.013*\"new\" + 0.012*\"misericordia\" + 0.010*\"quebec\"\n", + "2019-01-31 00:38:43,320 : INFO : topic #48 (0.020): 0.076*\"march\" + 0.075*\"sens\" + 0.074*\"octob\" + 0.068*\"juli\" + 0.068*\"januari\" + 0.066*\"notion\" + 0.066*\"august\" + 0.065*\"decatur\" + 0.065*\"april\" + 0.064*\"judici\"\n", + "2019-01-31 00:38:43,321 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.022*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"western\" + 0.015*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:38:43,327 : INFO : topic diff=0.006987, rho=0.038778\n", + "2019-01-31 00:38:43,483 : INFO : PROGRESS: pass 0, at document #1332000/4922894\n", + "2019-01-31 00:38:44,884 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:45,150 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:38:45,151 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"liber\" + 0.013*\"republ\" + 0.013*\"seaport\" + 0.013*\"selma\"\n", + "2019-01-31 00:38:45,152 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 
0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:38:45,154 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:38:45,155 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.010*\"linear\" + 0.010*\"rosenwald\"\n", + "2019-01-31 00:38:45,160 : INFO : topic diff=0.007573, rho=0.038749\n", + "2019-01-31 00:38:45,318 : INFO : PROGRESS: pass 0, at document #1334000/4922894\n", + "2019-01-31 00:38:46,727 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:46,993 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:38:46,994 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 00:38:46,995 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.007*\"championship\" + 0.007*\"softwar\" + 0.007*\"user\" + 0.007*\"serv\" + 0.007*\"base\"\n", + "2019-01-31 00:38:46,996 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.042*\"chilton\" + 0.023*\"korea\" + 0.022*\"hong\" + 0.021*\"kong\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.015*\"kim\" + 0.012*\"thailand\"\n", + "2019-01-31 00:38:46,997 : INFO : topic #48 (0.020): 0.076*\"sens\" + 0.074*\"march\" + 0.074*\"octob\" + 
0.069*\"juli\" + 0.068*\"januari\" + 0.066*\"notion\" + 0.065*\"august\" + 0.064*\"april\" + 0.064*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 00:38:47,003 : INFO : topic diff=0.006376, rho=0.038720\n", + "2019-01-31 00:38:47,157 : INFO : PROGRESS: pass 0, at document #1336000/4922894\n", + "2019-01-31 00:38:48,532 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:48,798 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.014*\"diversifi\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.012*\"militari\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:38:48,800 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.022*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"colder\" + 0.016*\"western\" + 0.015*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:38:48,801 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.007*\"trade\" + 0.007*\"like\" + 0.007*\"uruguayan\" + 0.006*\"god\"\n", + "2019-01-31 00:38:48,802 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.007*\"championship\" + 0.007*\"softwar\" + 0.007*\"user\" + 0.007*\"base\" + 0.007*\"serv\"\n", + "2019-01-31 00:38:48,803 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.019*\"serv\" + 0.019*\"member\" + 0.017*\"gener\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:38:48,809 : INFO : topic diff=0.006900, rho=0.038691\n", + "2019-01-31 00:38:48,964 : INFO : PROGRESS: pass 0, at document #1338000/4922894\n", + "2019-01-31 00:38:50,363 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:38:50,633 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"blue\" + 0.006*\"comic\" + 0.005*\"septemb\" + 0.005*\"dixi\" + 0.005*\"charact\" + 0.004*\"vision\" + 0.004*\"appear\"\n", + "2019-01-31 00:38:50,634 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.038*\"arsen\" + 0.035*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.016*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:38:50,635 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:38:50,636 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"jean\" + 0.023*\"sail\" + 0.019*\"daphn\" + 0.014*\"lazi\" + 0.014*\"loui\" + 0.012*\"piec\" + 0.007*\"wine\"\n", + "2019-01-31 00:38:50,637 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.007*\"championship\" + 0.007*\"softwar\" + 0.007*\"user\" + 0.007*\"base\" + 0.007*\"serv\"\n", + "2019-01-31 00:38:50,643 : INFO : topic diff=0.005915, rho=0.038662\n", + "2019-01-31 00:38:53,374 : INFO : -11.503 per-word bound, 2901.7 perplexity estimate based on a held-out corpus of 2000 documents with 573812 words\n", + "2019-01-31 00:38:53,375 : INFO : PROGRESS: pass 0, at document #1340000/4922894\n", + "2019-01-31 00:38:54,774 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:55,041 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"diversifi\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.012*\"militari\"\n", + "2019-01-31 00:38:55,042 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 
0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 00:38:55,043 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:38:55,044 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:38:55,045 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"sri\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 00:38:55,051 : INFO : topic diff=0.006151, rho=0.038633\n", + "2019-01-31 00:38:55,213 : INFO : PROGRESS: pass 0, at document #1342000/4922894\n", + "2019-01-31 00:38:56,606 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:56,874 : INFO : topic #29 (0.020): 0.022*\"companhia\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"busi\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.008*\"produc\" + 0.007*\"manag\" + 0.007*\"industri\" + 0.007*\"function\"\n", + "2019-01-31 00:38:56,876 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.019*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\" + 0.010*\"lizard\"\n", + "2019-01-31 00:38:56,877 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"collect\"\n", + "2019-01-31 00:38:56,878 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"televis\" + 0.012*\"pakistan\" + 
0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 00:38:56,879 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.023*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"liber\" + 0.014*\"seaport\" + 0.014*\"republ\" + 0.013*\"selma\"\n", + "2019-01-31 00:38:56,885 : INFO : topic diff=0.005921, rho=0.038605\n", + "2019-01-31 00:38:57,099 : INFO : PROGRESS: pass 0, at document #1344000/4922894\n", + "2019-01-31 00:38:58,484 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:38:58,750 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"live\" + 0.010*\"genu\" + 0.009*\"biom\"\n", + "2019-01-31 00:38:58,752 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"dixi\" + 0.004*\"vision\" + 0.004*\"appear\"\n", + "2019-01-31 00:38:58,753 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.043*\"chilton\" + 0.023*\"korea\" + 0.022*\"hong\" + 0.021*\"kong\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.015*\"leah\" + 0.012*\"thailand\"\n", + "2019-01-31 00:38:58,754 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:38:58,756 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.009*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:38:58,761 : INFO : topic diff=0.006444, rho=0.038576\n", + "2019-01-31 00:38:58,919 : INFO : PROGRESS: pass 0, at document #1346000/4922894\n", + "2019-01-31 
00:39:00,342 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:00,609 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:39:00,610 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"live\" + 0.009*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:39:00,611 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"dixi\" + 0.004*\"appear\" + 0.004*\"vision\"\n", + "2019-01-31 00:39:00,612 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:39:00,613 : INFO : topic #48 (0.020): 0.076*\"sens\" + 0.076*\"octob\" + 0.075*\"march\" + 0.069*\"juli\" + 0.068*\"januari\" + 0.067*\"notion\" + 0.067*\"august\" + 0.065*\"april\" + 0.064*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 00:39:00,619 : INFO : topic diff=0.006029, rho=0.038547\n", + "2019-01-31 00:39:00,779 : INFO : PROGRESS: pass 0, at document #1348000/4922894\n", + "2019-01-31 00:39:02,209 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:02,476 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.007*\"till\" + 0.006*\"pour\"\n", + "2019-01-31 00:39:02,477 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 
0.014*\"republ\" + 0.014*\"liber\" + 0.014*\"seaport\" + 0.013*\"selma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:39:02,478 : INFO : topic #48 (0.020): 0.076*\"sens\" + 0.076*\"octob\" + 0.075*\"march\" + 0.069*\"juli\" + 0.068*\"januari\" + 0.068*\"notion\" + 0.067*\"august\" + 0.065*\"april\" + 0.064*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 00:39:02,479 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:39:02,480 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:39:02,486 : INFO : topic diff=0.006705, rho=0.038519\n", + "2019-01-31 00:39:02,645 : INFO : PROGRESS: pass 0, at document #1350000/4922894\n", + "2019-01-31 00:39:04,030 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:04,299 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"vernon\"\n", + "2019-01-31 00:39:04,300 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"live\" + 0.009*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:39:04,301 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.017*\"damag\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"sweden\" + 0.014*\"wind\" + 0.014*\"replac\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 00:39:04,302 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 
0.023*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"campbel\" + 0.009*\"class\"\n", + "2019-01-31 00:39:04,303 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.022*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:39:04,309 : INFO : topic diff=0.006086, rho=0.038490\n", + "2019-01-31 00:39:04,464 : INFO : PROGRESS: pass 0, at document #1352000/4922894\n", + "2019-01-31 00:39:05,847 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:06,114 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.021*\"cathol\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"dioces\"\n", + "2019-01-31 00:39:06,115 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:39:06,116 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"bahá\" + 0.009*\"vernon\"\n", + "2019-01-31 00:39:06,117 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"appear\" + 0.004*\"dixi\" + 0.004*\"litig\"\n", + "2019-01-31 00:39:06,119 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.006*\"woman\"\n", + "2019-01-31 00:39:06,125 : INFO : topic diff=0.006666, rho=0.038462\n", + "2019-01-31 00:39:06,283 : INFO : PROGRESS: pass 0, at 
document #1354000/4922894\n", + "2019-01-31 00:39:07,702 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:07,968 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"diversifi\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\"\n", + "2019-01-31 00:39:07,969 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:39:07,970 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.038*\"rural\" + 0.035*\"sovereignti\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.022*\"poison\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"alexand\"\n", + "2019-01-31 00:39:07,971 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.018*\"candid\" + 0.017*\"taxpay\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"horac\" + 0.010*\"ret\" + 0.010*\"landslid\" + 0.010*\"tornado\"\n", + "2019-01-31 00:39:07,972 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:39:07,978 : INFO : topic diff=0.006220, rho=0.038433\n", + "2019-01-31 00:39:08,138 : INFO : PROGRESS: pass 0, at document #1356000/4922894\n", + "2019-01-31 00:39:09,546 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:09,812 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"hormon\" + 0.006*\"human\"\n", + "2019-01-31 00:39:09,813 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.046*\"franc\" + 
0.030*\"pari\" + 0.025*\"jean\" + 0.023*\"sail\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.014*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:39:09,814 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.015*\"orchestr\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 00:39:09,815 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.022*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"live\" + 0.009*\"genu\" + 0.009*\"yawn\"\n", + "2019-01-31 00:39:09,817 : INFO : topic #29 (0.020): 0.022*\"companhia\" + 0.010*\"million\" + 0.010*\"busi\" + 0.010*\"bank\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.008*\"produc\" + 0.007*\"industri\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:39:09,822 : INFO : topic diff=0.006880, rho=0.038405\n", + "2019-01-31 00:39:09,984 : INFO : PROGRESS: pass 0, at document #1358000/4922894\n", + "2019-01-31 00:39:11,422 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:11,688 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.022*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:39:11,689 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 00:39:11,690 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.013*\"seaport\" + 0.013*\"selma\"\n", + "2019-01-31 00:39:11,691 : INFO : topic #31 (0.020): 0.057*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"taxpay\" + 
0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"barber\"\n", + "2019-01-31 00:39:11,692 : INFO : topic #29 (0.020): 0.023*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"bank\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.008*\"produc\" + 0.007*\"industri\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:39:11,698 : INFO : topic diff=0.007065, rho=0.038376\n", + "2019-01-31 00:39:14,455 : INFO : -11.740 per-word bound, 3420.1 perplexity estimate based on a held-out corpus of 2000 documents with 572905 words\n", + "2019-01-31 00:39:14,456 : INFO : PROGRESS: pass 0, at document #1360000/4922894\n", + "2019-01-31 00:39:15,870 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:16,136 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"christian\" + 0.020*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"italian\"\n", + "2019-01-31 00:39:16,137 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.015*\"vol\" + 0.013*\"berlin\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"europ\" + 0.008*\"itali\"\n", + "2019-01-31 00:39:16,138 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:39:16,140 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.016*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"diversifi\" + 0.012*\"militari\" + 0.012*\"airbu\"\n", + "2019-01-31 00:39:16,141 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.028*\"valour\" + 0.019*\"folei\" + 
0.019*\"dutch\" + 0.018*\"polit\" + 0.018*\"player\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:39:16,146 : INFO : topic diff=0.005609, rho=0.038348\n", + "2019-01-31 00:39:16,305 : INFO : PROGRESS: pass 0, at document #1362000/4922894\n", + "2019-01-31 00:39:17,705 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:17,971 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"rural\" + 0.036*\"sovereignti\" + 0.025*\"personifi\" + 0.023*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.016*\"unfortun\" + 0.016*\"poland\" + 0.014*\"alexand\"\n", + "2019-01-31 00:39:17,973 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"championship\" + 0.007*\"base\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 00:39:17,974 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.006*\"socialist\"\n", + "2019-01-31 00:39:17,975 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"vernon\"\n", + "2019-01-31 00:39:17,976 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"member\" + 0.022*\"democrat\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.013*\"selma\" + 0.013*\"seaport\"\n", + "2019-01-31 00:39:17,982 : INFO : topic diff=0.006322, rho=0.038320\n", + "2019-01-31 00:39:18,137 : INFO : PROGRESS: pass 0, at document #1364000/4922894\n", + "2019-01-31 00:39:19,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:19,799 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 
0.021*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.012*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:39:19,800 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.014*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.010*\"fool\" + 0.010*\"théori\" + 0.010*\"scientist\"\n", + "2019-01-31 00:39:19,801 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.023*\"korea\" + 0.022*\"hong\" + 0.022*\"kong\" + 0.018*\"korean\" + 0.018*\"sourc\" + 0.014*\"kim\" + 0.014*\"leah\" + 0.012*\"shirin\"\n", + "2019-01-31 00:39:19,802 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.034*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:39:19,803 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.043*\"tortur\" + 0.030*\"cotton\" + 0.029*\"area\" + 0.023*\"multitud\" + 0.023*\"regim\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:39:19,809 : INFO : topic diff=0.006663, rho=0.038292\n", + "2019-01-31 00:39:19,964 : INFO : PROGRESS: pass 0, at document #1366000/4922894\n", + "2019-01-31 00:39:21,356 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:21,622 : INFO : topic #48 (0.020): 0.077*\"sens\" + 0.077*\"march\" + 0.075*\"octob\" + 0.071*\"august\" + 0.070*\"januari\" + 0.070*\"juli\" + 0.068*\"notion\" + 0.067*\"april\" + 0.065*\"decatur\" + 0.065*\"judici\"\n", + "2019-01-31 00:39:21,624 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"collect\"\n", + "2019-01-31 00:39:21,625 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 
0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"militari\" + 0.006*\"pour\" + 0.006*\"king\"\n", + "2019-01-31 00:39:21,626 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.007*\"disco\" + 0.007*\"pathwai\" + 0.007*\"media\" + 0.007*\"treat\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"have\" + 0.006*\"hormon\" + 0.006*\"effect\"\n", + "2019-01-31 00:39:21,627 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.029*\"pari\" + 0.025*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.014*\"loui\" + 0.012*\"piec\" + 0.012*\"wreath\"\n", + "2019-01-31 00:39:21,633 : INFO : topic diff=0.006700, rho=0.038264\n", + "2019-01-31 00:39:21,791 : INFO : PROGRESS: pass 0, at document #1368000/4922894\n", + "2019-01-31 00:39:23,185 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:23,451 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.020*\"serv\" + 0.019*\"member\" + 0.018*\"gener\" + 0.017*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:39:23,452 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.052*\"parti\" + 0.024*\"voluntari\" + 0.023*\"member\" + 0.022*\"democrat\" + 0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"report\" + 0.014*\"selma\" + 0.014*\"liber\"\n", + "2019-01-31 00:39:23,453 : INFO : topic #45 (0.020): 0.023*\"jpg\" + 0.022*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"western\" + 0.016*\"colder\" + 0.015*\"black\" + 0.013*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:39:23,454 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.015*\"damag\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.013*\"replac\" + 0.012*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 00:39:23,455 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 
0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:39:23,461 : INFO : topic diff=0.006293, rho=0.038236\n", + "2019-01-31 00:39:23,617 : INFO : PROGRESS: pass 0, at document #1370000/4922894\n", + "2019-01-31 00:39:25,004 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:25,270 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"open\"\n", + "2019-01-31 00:39:25,272 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.029*\"pari\" + 0.025*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.012*\"wreath\"\n", + "2019-01-31 00:39:25,274 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"pour\" + 0.006*\"king\"\n", + "2019-01-31 00:39:25,275 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:39:25,276 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.013*\"televis\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"islam\" + 0.011*\"sri\" + 0.011*\"tajikistan\" + 0.010*\"khalsa\" + 0.010*\"muskoge\"\n", + "2019-01-31 00:39:25,282 : INFO : topic diff=0.004829, rho=0.038208\n", + "2019-01-31 00:39:25,440 : INFO : PROGRESS: pass 0, at document #1372000/4922894\n", + "2019-01-31 00:39:26,820 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:27,087 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"member\" + 
0.022*\"democrat\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"selma\" + 0.014*\"report\" + 0.014*\"liber\"\n", + "2019-01-31 00:39:27,089 : INFO : topic #31 (0.020): 0.057*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.024*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"barber\"\n", + "2019-01-31 00:39:27,089 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.038*\"canadian\" + 0.020*\"hoar\" + 0.020*\"toronto\" + 0.018*\"ontario\" + 0.016*\"hydrogen\" + 0.013*\"new\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.011*\"quebec\"\n", + "2019-01-31 00:39:27,091 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"pour\" + 0.006*\"king\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:39:27,092 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.034*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:39:27,097 : INFO : topic diff=0.006412, rho=0.038180\n", + "2019-01-31 00:39:27,310 : INFO : PROGRESS: pass 0, at document #1374000/4922894\n", + "2019-01-31 00:39:28,710 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:28,976 : INFO : topic #48 (0.020): 0.077*\"march\" + 0.077*\"sens\" + 0.075*\"octob\" + 0.070*\"juli\" + 0.070*\"januari\" + 0.069*\"august\" + 0.068*\"notion\" + 0.067*\"april\" + 0.065*\"decatur\" + 0.065*\"judici\"\n", + "2019-01-31 00:39:28,977 : INFO : topic #12 (0.020): 0.007*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.005*\"method\"\n", + "2019-01-31 00:39:28,978 : INFO : topic #28 (0.020): 
0.031*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:39:28,980 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.033*\"priest\" + 0.022*\"quarterli\" + 0.020*\"duke\" + 0.018*\"grammat\" + 0.017*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.015*\"brazil\" + 0.014*\"princ\" + 0.013*\"portugues\"\n", + "2019-01-31 00:39:28,981 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:39:28,987 : INFO : topic diff=0.006169, rho=0.038152\n", + "2019-01-31 00:39:29,146 : INFO : PROGRESS: pass 0, at document #1376000/4922894\n", + "2019-01-31 00:39:30,566 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:30,833 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:39:30,834 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.043*\"tortur\" + 0.030*\"cotton\" + 0.029*\"area\" + 0.023*\"multitud\" + 0.023*\"regim\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:39:30,834 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"member\" + 0.022*\"democrat\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"liber\" + 0.014*\"report\" + 0.014*\"selma\"\n", + "2019-01-31 00:39:30,836 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.037*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.012*\"misericordia\" + 0.012*\"novotná\" + 0.011*\"quebec\"\n", + "2019-01-31 00:39:30,837 : 
INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:39:30,843 : INFO : topic diff=0.007082, rho=0.038125\n", + "2019-01-31 00:39:30,995 : INFO : PROGRESS: pass 0, at document #1378000/4922894\n", + "2019-01-31 00:39:32,361 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:32,627 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.005*\"servitud\" + 0.005*\"method\"\n", + "2019-01-31 00:39:32,628 : INFO : topic #31 (0.020): 0.058*\"fusiform\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.024*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 00:39:32,630 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.027*\"olymp\" + 0.026*\"woman\" + 0.025*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.017*\"taxpay\" + 0.017*\"nation\"\n", + "2019-01-31 00:39:32,631 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"bank\" + 0.009*\"market\" + 0.008*\"yawn\" + 0.008*\"produc\" + 0.007*\"industri\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:39:32,632 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 00:39:32,638 : INFO : topic diff=0.006106, rho=0.038097\n", + "2019-01-31 00:39:35,373 : INFO : -11.573 per-word bound, 3047.1 perplexity estimate based on a held-out corpus of 2000 documents with 550957 words\n", + "2019-01-31 00:39:35,373 : INFO : PROGRESS: pass 0, at 
document #1380000/4922894\n", + "2019-01-31 00:39:36,785 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:37,051 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.067*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.025*\"festiv\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.021*\"intern\" + 0.019*\"women\" + 0.015*\"prison\"\n", + "2019-01-31 00:39:37,052 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:39:37,053 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:39:37,055 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"pathwai\" + 0.007*\"disco\" + 0.007*\"media\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"have\" + 0.006*\"hormon\"\n", + "2019-01-31 00:39:37,056 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.013*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:39:37,061 : INFO : topic diff=0.004557, rho=0.038069\n", + "2019-01-31 00:39:37,218 : INFO : PROGRESS: pass 0, at document #1382000/4922894\n", + "2019-01-31 00:39:38,608 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:38,874 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.019*\"folei\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:39:38,875 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.038*\"arsen\" + 
0.036*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:39:38,876 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.010*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:39:38,877 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"highli\"\n", + "2019-01-31 00:39:38,878 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:39:38,884 : INFO : topic diff=0.004632, rho=0.038042\n", + "2019-01-31 00:39:39,044 : INFO : PROGRESS: pass 0, at document #1384000/4922894\n", + "2019-01-31 00:39:40,437 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:40,704 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.025*\"cortic\" + 0.018*\"start\" + 0.015*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.011*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:39:40,705 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:39:40,707 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.010*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"produc\" + 0.007*\"uruguayan\" + 0.007*\"develop\"\n", + "2019-01-31 00:39:40,708 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 
0.015*\"norwegian\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.012*\"replac\" + 0.012*\"denmark\" + 0.011*\"treeless\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:39:40,709 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"appear\" + 0.004*\"litig\" + 0.004*\"black\"\n", + "2019-01-31 00:39:40,715 : INFO : topic diff=0.006142, rho=0.038014\n", + "2019-01-31 00:39:40,869 : INFO : PROGRESS: pass 0, at document #1386000/4922894\n", + "2019-01-31 00:39:42,244 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:42,510 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:39:42,511 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:39:42,512 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.036*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:39:42,514 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.011*\"deal\"\n", + "2019-01-31 00:39:42,515 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.021*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:39:42,521 : INFO : topic diff=0.006396, rho=0.037987\n", + "2019-01-31 00:39:42,671 : INFO : 
PROGRESS: pass 0, at document #1388000/4922894\n", + "2019-01-31 00:39:44,029 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:44,295 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:39:44,296 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"physician\" + 0.012*\"jack\"\n", + "2019-01-31 00:39:44,297 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.038*\"canadian\" + 0.020*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.014*\"hydrogen\" + 0.014*\"new\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.011*\"quebec\"\n", + "2019-01-31 00:39:44,298 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.041*\"line\" + 0.038*\"arsen\" + 0.036*\"raid\" + 0.027*\"museo\" + 0.021*\"traceabl\" + 0.017*\"serv\" + 0.015*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:39:44,299 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.019*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:39:44,305 : INFO : topic diff=0.006081, rho=0.037959\n", + "2019-01-31 00:39:44,465 : INFO : PROGRESS: pass 0, at document #1390000/4922894\n", + "2019-01-31 00:39:45,885 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:46,151 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"litig\" + 0.004*\"appear\" + 0.004*\"black\"\n", + "2019-01-31 00:39:46,152 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 
0.007*\"number\" + 0.007*\"utopian\" + 0.007*\"poet\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"method\"\n", + "2019-01-31 00:39:46,154 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:39:46,155 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"member\" + 0.022*\"democrat\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"selma\" + 0.013*\"liber\"\n", + "2019-01-31 00:39:46,156 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.013*\"professor\" + 0.013*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:39:46,162 : INFO : topic diff=0.005939, rho=0.037932\n", + "2019-01-31 00:39:46,312 : INFO : PROGRESS: pass 0, at document #1392000/4922894\n", + "2019-01-31 00:39:47,678 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:47,944 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:39:47,945 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.019*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:39:47,946 : INFO : topic #15 (0.020): 0.011*\"organ\" + 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.010*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.007*\"socialist\"\n", + "2019-01-31 00:39:47,947 : INFO : topic #14 (0.020): 0.024*\"forc\" + 
0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.012*\"militari\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:39:47,948 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.037*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.019*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:39:47,954 : INFO : topic diff=0.005970, rho=0.037905\n", + "2019-01-31 00:39:48,113 : INFO : PROGRESS: pass 0, at document #1394000/4922894\n", + "2019-01-31 00:39:49,531 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:49,798 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.021*\"cathol\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"parish\" + 0.009*\"relationship\" + 0.009*\"centuri\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:39:49,799 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.037*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:39:49,800 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.022*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:39:49,801 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.027*\"olymp\" + 0.027*\"woman\" + 0.025*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.017*\"nation\"\n", + "2019-01-31 00:39:49,802 : INFO : topic #36 (0.020): 0.012*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.007*\"user\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 00:39:49,808 : INFO : topic 
diff=0.005093, rho=0.037878\n", + "2019-01-31 00:39:49,974 : INFO : PROGRESS: pass 0, at document #1396000/4922894\n", + "2019-01-31 00:39:51,427 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:51,693 : INFO : topic #1 (0.020): 0.058*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.017*\"sourc\" + 0.014*\"leah\" + 0.013*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:39:51,694 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"blue\" + 0.006*\"comic\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"litig\" + 0.004*\"appear\" + 0.004*\"black\"\n", + "2019-01-31 00:39:51,695 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.076*\"octob\" + 0.076*\"juli\" + 0.072*\"august\" + 0.071*\"januari\" + 0.070*\"april\" + 0.069*\"notion\" + 0.069*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 00:39:51,696 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.008*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"king\" + 0.006*\"till\"\n", + "2019-01-31 00:39:51,697 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.025*\"cortic\" + 0.018*\"start\" + 0.015*\"act\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.007*\"judaism\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:39:51,703 : INFO : topic diff=0.007833, rho=0.037851\n", + "2019-01-31 00:39:51,858 : INFO : PROGRESS: pass 0, at document #1398000/4922894\n", + "2019-01-31 00:39:53,244 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:53,511 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 0.008*\"number\" + 0.007*\"utopian\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 
0.006*\"method\"\n", + "2019-01-31 00:39:53,512 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.028*\"new\" + 0.021*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:39:53,513 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.024*\"septemb\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:39:53,514 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"pathwai\" + 0.007*\"disco\" + 0.007*\"media\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"have\" + 0.006*\"acid\"\n", + "2019-01-31 00:39:53,515 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.037*\"rural\" + 0.036*\"sovereignti\" + 0.026*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.017*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:39:53,521 : INFO : topic diff=0.005280, rho=0.037823\n", + "2019-01-31 00:39:56,202 : INFO : -11.583 per-word bound, 3068.1 perplexity estimate based on a held-out corpus of 2000 documents with 541339 words\n", + "2019-01-31 00:39:56,203 : INFO : PROGRESS: pass 0, at document #1400000/4922894\n", + "2019-01-31 00:39:57,598 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:57,865 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.008*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"king\" + 0.006*\"till\"\n", + "2019-01-31 00:39:57,866 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"josé\" + 0.011*\"francisco\" + 0.011*\"plung\"\n", + "2019-01-31 00:39:57,867 : INFO : topic #45 (0.020): 0.024*\"jpg\" + 
0.021*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"western\" + 0.016*\"black\" + 0.013*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:39:57,868 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"litig\" + 0.004*\"appear\" + 0.004*\"black\"\n", + "2019-01-31 00:39:57,869 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:39:57,875 : INFO : topic diff=0.005368, rho=0.037796\n", + "2019-01-31 00:39:58,028 : INFO : PROGRESS: pass 0, at document #1402000/4922894\n", + "2019-01-31 00:39:59,406 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:39:59,673 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.021*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:39:59,674 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.016*\"mount\" + 0.009*\"palmer\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 00:39:59,675 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.027*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:39:59,676 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.012*\"islam\" + 0.012*\"anglo\" + 0.010*\"alam\" + 0.010*\"khalsa\" + 0.010*\"sri\" + 0.009*\"tajikistan\"\n", + "2019-01-31 00:39:59,677 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 
0.020*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"live\" + 0.010*\"genu\" + 0.008*\"yawn\"\n", + "2019-01-31 00:39:59,683 : INFO : topic diff=0.005208, rho=0.037769\n", + "2019-01-31 00:39:59,838 : INFO : PROGRESS: pass 0, at document #1404000/4922894\n", + "2019-01-31 00:40:01,227 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:01,493 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"armi\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"king\" + 0.006*\"pour\"\n", + "2019-01-31 00:40:01,494 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"american\" + 0.031*\"unionist\" + 0.029*\"cotton\" + 0.027*\"new\" + 0.016*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.013*\"north\"\n", + "2019-01-31 00:40:01,495 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.012*\"airmen\"\n", + "2019-01-31 00:40:01,496 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.030*\"priest\" + 0.021*\"quarterli\" + 0.020*\"duke\" + 0.019*\"grammat\" + 0.017*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.016*\"brazil\" + 0.015*\"princ\" + 0.014*\"kingdom\"\n", + "2019-01-31 00:40:01,497 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"nicola\" + 0.012*\"presid\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:40:01,503 : INFO : topic diff=0.005555, rho=0.037743\n", + "2019-01-31 00:40:01,714 : INFO : PROGRESS: pass 0, at document #1406000/4922894\n", + "2019-01-31 00:40:03,119 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:03,386 : INFO : topic #3 (0.020): 0.036*\"present\" + 
0.027*\"offic\" + 0.023*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.017*\"serv\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:03,387 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.036*\"arsen\" + 0.036*\"raid\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:40:03,388 : INFO : topic #36 (0.020): 0.012*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"develop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.007*\"championship\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 00:40:03,389 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.028*\"new\" + 0.021*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:40:03,390 : INFO : topic #46 (0.020): 0.017*\"swedish\" + 0.017*\"sweden\" + 0.017*\"norwai\" + 0.016*\"stop\" + 0.015*\"damag\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.012*\"denmark\" + 0.011*\"replac\" + 0.011*\"farid\"\n", + "2019-01-31 00:40:03,396 : INFO : topic diff=0.005826, rho=0.037716\n", + "2019-01-31 00:40:03,555 : INFO : PROGRESS: pass 0, at document #1408000/4922894\n", + "2019-01-31 00:40:04,959 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:05,225 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:40:05,226 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"nicola\" + 0.012*\"presid\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:40:05,228 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"warmth\" + 
0.017*\"lagrang\" + 0.016*\"area\" + 0.016*\"mount\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"lobe\" + 0.008*\"land\"\n", + "2019-01-31 00:40:05,228 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 00:40:05,229 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"member\" + 0.021*\"democrat\" + 0.017*\"polici\" + 0.015*\"seaport\" + 0.014*\"republ\" + 0.014*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 00:40:05,236 : INFO : topic diff=0.005156, rho=0.037689\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:40:05,390 : INFO : PROGRESS: pass 0, at document #1410000/4922894\n", + "2019-01-31 00:40:06,764 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:07,030 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.010*\"isra\" + 0.009*\"europ\"\n", + "2019-01-31 00:40:07,031 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"wander\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:40:07,032 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"member\" + 0.021*\"democrat\" + 0.016*\"polici\" + 0.015*\"seaport\" + 0.015*\"republ\" + 0.014*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 00:40:07,033 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.021*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:40:07,034 : INFO : 
topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"pseudo\" + 0.009*\"gothic\" + 0.009*\"district\"\n", + "2019-01-31 00:40:07,040 : INFO : topic diff=0.004562, rho=0.037662\n", + "2019-01-31 00:40:07,193 : INFO : PROGRESS: pass 0, at document #1412000/4922894\n", + "2019-01-31 00:40:08,575 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:08,841 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"isra\" + 0.010*\"european\" + 0.009*\"europ\"\n", + "2019-01-31 00:40:08,842 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.012*\"pakistan\" + 0.012*\"islam\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.010*\"alam\" + 0.010*\"sri\" + 0.010*\"tajikistan\" + 0.010*\"khalsa\"\n", + "2019-01-31 00:40:08,843 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.018*\"taxpay\" + 0.017*\"ret\" + 0.017*\"candid\" + 0.013*\"find\" + 0.012*\"driver\" + 0.010*\"fool\" + 0.010*\"tornado\" + 0.010*\"scientist\" + 0.010*\"landslid\"\n", + "2019-01-31 00:40:08,844 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.047*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.016*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.014*\"kim\"\n", + "2019-01-31 00:40:08,846 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.017*\"gener\" + 0.017*\"serv\" + 0.017*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:08,851 : INFO : topic diff=0.006399, rho=0.037635\n", + "2019-01-31 00:40:09,006 : INFO : PROGRESS: pass 0, at document #1414000/4922894\n", + "2019-01-31 00:40:10,377 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:40:10,643 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.014*\"pope\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:40:10,644 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.077*\"march\" + 0.077*\"octob\" + 0.075*\"juli\" + 0.072*\"august\" + 0.069*\"april\" + 0.069*\"januari\" + 0.069*\"notion\" + 0.068*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 00:40:10,645 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.018*\"sweden\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.015*\"damag\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.012*\"denmark\" + 0.011*\"replac\" + 0.011*\"farid\"\n", + "2019-01-31 00:40:10,646 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.030*\"priest\" + 0.022*\"quarterli\" + 0.020*\"duke\" + 0.019*\"grammat\" + 0.018*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.015*\"brazil\" + 0.014*\"kingdom\" + 0.014*\"princ\"\n", + "2019-01-31 00:40:10,647 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.037*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.025*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.017*\"unfortun\" + 0.013*\"tyrant\"\n", + "2019-01-31 00:40:10,653 : INFO : topic diff=0.005349, rho=0.037609\n", + "2019-01-31 00:40:10,808 : INFO : PROGRESS: pass 0, at document #1416000/4922894\n", + "2019-01-31 00:40:12,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:12,413 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:40:12,414 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.015*\"seaport\" + 0.013*\"liber\" + 0.013*\"selma\"\n", + 
"2019-01-31 00:40:12,415 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.012*\"airmen\"\n", + "2019-01-31 00:40:12,416 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.012*\"anglo\" + 0.010*\"alam\" + 0.010*\"tajikistan\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 00:40:12,417 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 0.008*\"number\" + 0.007*\"gener\" + 0.006*\"utopian\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"theoret\"\n", + "2019-01-31 00:40:12,423 : INFO : topic diff=0.007461, rho=0.037582\n", + "2019-01-31 00:40:12,582 : INFO : PROGRESS: pass 0, at document #1418000/4922894\n", + "2019-01-31 00:40:13,998 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:14,264 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"taxpay\" + 0.017*\"candid\" + 0.016*\"ret\" + 0.013*\"find\" + 0.012*\"driver\" + 0.011*\"tornado\" + 0.010*\"fool\" + 0.010*\"landslid\" + 0.010*\"théori\"\n", + "2019-01-31 00:40:14,265 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.021*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"district\" + 0.009*\"pseudo\"\n", + "2019-01-31 00:40:14,266 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.032*\"unionist\" + 0.031*\"american\" + 0.031*\"cotton\" + 0.027*\"new\" + 0.016*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:40:14,267 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"biom\"\n", + 
"2019-01-31 00:40:14,268 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"develop\"\n", + "2019-01-31 00:40:14,274 : INFO : topic diff=0.005952, rho=0.037556\n", + "2019-01-31 00:40:17,008 : INFO : -11.470 per-word bound, 2837.0 perplexity estimate based on a held-out corpus of 2000 documents with 578534 words\n", + "2019-01-31 00:40:17,008 : INFO : PROGRESS: pass 0, at document #1420000/4922894\n", + "2019-01-31 00:40:18,402 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:18,669 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"wander\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:40:18,671 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"utopian\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"theoret\" + 0.006*\"southern\" + 0.006*\"measur\"\n", + "2019-01-31 00:40:18,672 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"mode\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"produc\" + 0.007*\"develop\"\n", + "2019-01-31 00:40:18,673 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.038*\"sovereignti\" + 0.036*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.018*\"unfortun\" + 0.017*\"poland\" + 0.013*\"czech\"\n", + "2019-01-31 00:40:18,674 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.008*\"disco\" + 0.006*\"proper\" + 0.006*\"acid\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"caus\" + 0.006*\"hormon\"\n", + "2019-01-31 00:40:18,679 : INFO : topic diff=0.006277, rho=0.037529\n" + ] + }, 
+ { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:40:18,839 : INFO : PROGRESS: pass 0, at document #1422000/4922894\n", + "2019-01-31 00:40:20,255 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:20,521 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"septemb\" + 0.005*\"charact\" + 0.004*\"black\" + 0.004*\"appear\" + 0.004*\"litig\"\n", + "2019-01-31 00:40:20,523 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:40:20,524 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.022*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.017*\"gener\" + 0.017*\"serv\" + 0.017*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:20,525 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.042*\"tortur\" + 0.030*\"cotton\" + 0.027*\"area\" + 0.025*\"multitud\" + 0.022*\"regim\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:40:20,526 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.009*\"bank\" + 0.009*\"market\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:40:20,532 : INFO : topic diff=0.006061, rho=0.037503\n", + "2019-01-31 00:40:20,683 : INFO : PROGRESS: pass 0, at document #1424000/4922894\n", + "2019-01-31 00:40:22,056 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:22,321 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"itali\" + 0.009*\"isra\"\n", + 
"2019-01-31 00:40:22,322 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:40:22,323 : INFO : topic #46 (0.020): 0.020*\"sweden\" + 0.018*\"swedish\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.012*\"denmark\" + 0.011*\"replac\" + 0.011*\"farid\"\n", + "2019-01-31 00:40:22,324 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"base\"\n", + "2019-01-31 00:40:22,326 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.022*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.007*\"depress\"\n", + "2019-01-31 00:40:22,331 : INFO : topic diff=0.005725, rho=0.037477\n", + "2019-01-31 00:40:22,486 : INFO : PROGRESS: pass 0, at document #1426000/4922894\n", + "2019-01-31 00:40:23,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:24,143 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:40:24,144 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"sri\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"tajikistan\"\n", + "2019-01-31 00:40:24,146 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 
00:40:24,147 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.032*\"cotton\" + 0.031*\"american\" + 0.027*\"new\" + 0.016*\"year\" + 0.013*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:40:24,148 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"acid\" + 0.006*\"proper\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:40:24,154 : INFO : topic diff=0.006087, rho=0.037450\n", + "2019-01-31 00:40:24,311 : INFO : PROGRESS: pass 0, at document #1428000/4922894\n", + "2019-01-31 00:40:25,687 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:25,957 : INFO : topic #19 (0.020): 0.014*\"languag\" + 0.011*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.007*\"god\" + 0.007*\"like\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:40:25,958 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:40:25,959 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.022*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.007*\"depress\"\n", + "2019-01-31 00:40:25,960 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"septemb\" + 0.005*\"blue\" + 0.005*\"charact\" + 0.004*\"appear\" + 0.004*\"black\" + 0.004*\"litig\"\n", + "2019-01-31 00:40:25,961 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:40:25,968 : INFO : topic 
diff=0.006226, rho=0.037424\n", + "2019-01-31 00:40:26,128 : INFO : PROGRESS: pass 0, at document #1430000/4922894\n", + "2019-01-31 00:40:27,524 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:27,791 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:40:27,792 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.015*\"shirin\" + 0.014*\"leah\"\n", + "2019-01-31 00:40:27,793 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:40:27,795 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.025*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"yard\"\n", + "2019-01-31 00:40:27,796 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 00:40:27,802 : INFO : topic diff=0.005176, rho=0.037398\n", + "2019-01-31 00:40:27,961 : INFO : PROGRESS: pass 0, at document #1432000/4922894\n", + "2019-01-31 00:40:29,363 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:29,629 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.015*\"lazi\" + 0.014*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:40:29,630 : INFO : topic #17 (0.020): 0.075*\"church\" 
+ 0.021*\"cathol\" + 0.021*\"christian\" + 0.021*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:40:29,632 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:40:29,633 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.043*\"tortur\" + 0.031*\"cotton\" + 0.027*\"area\" + 0.024*\"multitud\" + 0.022*\"regim\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:40:29,634 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.015*\"shirin\" + 0.014*\"leah\"\n", + "2019-01-31 00:40:29,640 : INFO : topic diff=0.006892, rho=0.037372\n", + "2019-01-31 00:40:29,795 : INFO : PROGRESS: pass 0, at document #1434000/4922894\n", + "2019-01-31 00:40:31,182 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:31,448 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.011*\"replac\" + 0.011*\"denmark\" + 0.011*\"farid\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:40:31,449 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:40:31,450 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 
00:40:31,452 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.039*\"line\" + 0.035*\"arsen\" + 0.035*\"raid\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.015*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:40:31,453 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.019*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"airmen\"\n", + "2019-01-31 00:40:31,459 : INFO : topic diff=0.005614, rho=0.037346\n", + "2019-01-31 00:40:31,616 : INFO : PROGRESS: pass 0, at document #1436000/4922894\n", + "2019-01-31 00:40:33,473 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:33,740 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.023*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:40:33,742 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.024*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"depress\"\n", + "2019-01-31 00:40:33,743 : INFO : topic #39 (0.020): 0.052*\"canada\" + 0.040*\"canadian\" + 0.021*\"toronto\" + 0.020*\"hoar\" + 0.019*\"ontario\" + 0.014*\"new\" + 0.013*\"hydrogen\" + 0.012*\"quebec\" + 0.012*\"novotná\" + 0.011*\"misericordia\"\n", + "2019-01-31 00:40:33,744 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.064*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.025*\"japanes\" + 0.022*\"festiv\" + 0.022*\"noll\" + 0.019*\"women\" + 0.019*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:40:33,745 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.015*\"seaport\" + 0.014*\"report\" + 0.014*\"liber\"\n", + "2019-01-31 
00:40:33,751 : INFO : topic diff=0.005369, rho=0.037320\n", + "2019-01-31 00:40:33,908 : INFO : PROGRESS: pass 0, at document #1438000/4922894\n", + "2019-01-31 00:40:35,469 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:35,736 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 0.008*\"number\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"poet\" + 0.006*\"method\" + 0.006*\"theoret\"\n", + "2019-01-31 00:40:35,737 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"championship\" + 0.007*\"includ\"\n", + "2019-01-31 00:40:35,738 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"warmth\" + 0.016*\"area\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.008*\"palmer\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"crayfish\" + 0.008*\"north\"\n", + "2019-01-31 00:40:35,739 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.018*\"unfortun\" + 0.017*\"poland\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:40:35,740 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.040*\"canadian\" + 0.021*\"toronto\" + 0.019*\"hoar\" + 0.019*\"ontario\" + 0.014*\"new\" + 0.013*\"hydrogen\" + 0.012*\"quebec\" + 0.011*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:40:35,746 : INFO : topic diff=0.005464, rho=0.037294\n", + "2019-01-31 00:40:38,513 : INFO : -11.663 per-word bound, 3243.7 perplexity estimate based on a held-out corpus of 2000 documents with 590721 words\n", + "2019-01-31 00:40:38,514 : INFO : PROGRESS: pass 0, at document #1440000/4922894\n", + "2019-01-31 00:40:39,905 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:40,171 : INFO : topic #46 (0.020): 
0.019*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"treeless\" + 0.011*\"denmark\" + 0.011*\"replac\"\n", + "2019-01-31 00:40:40,172 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"francisco\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 00:40:40,173 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.017*\"serv\" + 0.017*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:40:40,174 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.009*\"market\" + 0.009*\"bank\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:40:40,175 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.029*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.017*\"champion\" + 0.016*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"poet\"\n", + "2019-01-31 00:40:40,181 : INFO : topic diff=0.007480, rho=0.037268\n", + "2019-01-31 00:40:40,335 : INFO : PROGRESS: pass 0, at document #1442000/4922894\n", + "2019-01-31 00:40:41,711 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:41,977 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.016*\"physician\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 00:40:41,978 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"report\" + 0.014*\"bypass\"\n", + "2019-01-31 00:40:41,979 : INFO : topic #48 
(0.020): 0.079*\"sens\" + 0.078*\"march\" + 0.078*\"octob\" + 0.075*\"juli\" + 0.071*\"januari\" + 0.070*\"august\" + 0.070*\"judici\" + 0.070*\"notion\" + 0.070*\"april\" + 0.067*\"decatur\"\n", + "2019-01-31 00:40:41,980 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:40:41,981 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.010*\"tajikistan\" + 0.010*\"sri\" + 0.009*\"alam\"\n", + "2019-01-31 00:40:41,987 : INFO : topic diff=0.004971, rho=0.037242\n", + "2019-01-31 00:40:42,145 : INFO : PROGRESS: pass 0, at document #1444000/4922894\n", + "2019-01-31 00:40:43,578 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:43,845 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.015*\"physician\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 00:40:43,846 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"market\" + 0.009*\"bank\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:40:43,847 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 00:40:43,848 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"nation\" + 0.018*\"taxpay\" + 0.016*\"théori\"\n", + "2019-01-31 00:40:43,849 : INFO : topic #15 
(0.020): 0.011*\"organ\" + 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:40:43,855 : INFO : topic diff=0.005690, rho=0.037216\n", + "2019-01-31 00:40:44,010 : INFO : PROGRESS: pass 0, at document #1446000/4922894\n", + "2019-01-31 00:40:45,401 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:45,671 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.028*\"poison\" + 0.023*\"reprint\" + 0.022*\"personifi\" + 0.020*\"moscow\" + 0.019*\"unfortun\" + 0.017*\"poland\" + 0.014*\"malaysia\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:40:45,673 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.011*\"cathedr\" + 0.009*\"parish\" + 0.009*\"relationship\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:40:45,674 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.043*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.017*\"kim\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 00:40:45,675 : INFO : topic #36 (0.020): 0.012*\"prognosi\" + 0.010*\"network\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"championship\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.007*\"base\"\n", + "2019-01-31 00:40:45,676 : INFO : topic #12 (0.020): 0.008*\"frontal\" + 0.008*\"number\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"theoret\" + 0.006*\"method\"\n", + "2019-01-31 00:40:45,682 : INFO : topic diff=0.005764, rho=0.037190\n", + "2019-01-31 00:40:45,837 : INFO : PROGRESS: pass 0, at document #1448000/4922894\n", + "2019-01-31 00:40:47,217 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:47,483 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.020*\"godaddi\" + 0.017*\"taxpay\" + 0.016*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"find\" + 0.012*\"fool\" + 0.011*\"poet\" + 0.011*\"landslid\"\n", + "2019-01-31 00:40:47,485 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"charact\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"litig\" + 0.004*\"black\"\n", + "2019-01-31 00:40:47,486 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.015*\"physician\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:40:47,487 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.032*\"american\" + 0.030*\"cotton\" + 0.027*\"new\" + 0.016*\"year\" + 0.013*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:40:47,488 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"acid\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"hormon\" + 0.006*\"treat\"\n", + "2019-01-31 00:40:47,494 : INFO : topic diff=0.007230, rho=0.037165\n", + "2019-01-31 00:40:47,653 : INFO : PROGRESS: pass 0, at document #1450000/4922894\n", + "2019-01-31 00:40:49,053 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:49,319 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.019*\"gener\" + 0.017*\"serv\" + 0.017*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:49,320 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.027*\"reconstruct\" + 0.022*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 
0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:40:49,321 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:40:49,322 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.015*\"lazi\" + 0.014*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:40:49,324 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:40:49,329 : INFO : topic diff=0.006050, rho=0.037139\n", + "2019-01-31 00:40:49,480 : INFO : PROGRESS: pass 0, at document #1452000/4922894\n", + "2019-01-31 00:40:50,832 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:51,099 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.032*\"priest\" + 0.020*\"quarterli\" + 0.019*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.019*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"princ\"\n", + "2019-01-31 00:40:51,100 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.013*\"briarwood\" + 0.012*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:40:51,101 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.015*\"lazi\" + 0.015*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:40:51,102 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 
0.004*\"call\"\n", + "2019-01-31 00:40:51,103 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 00:40:51,109 : INFO : topic diff=0.005361, rho=0.037113\n", + "2019-01-31 00:40:51,269 : INFO : PROGRESS: pass 0, at document #1454000/4922894\n", + "2019-01-31 00:40:52,706 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:52,973 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\" + 0.017*\"atheist\"\n", + "2019-01-31 00:40:52,974 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:40:52,975 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"wind\" + 0.016*\"stop\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"farid\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 00:40:52,976 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.019*\"gener\" + 0.017*\"seri\" + 0.017*\"serv\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:52,977 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"hormon\" + 0.006*\"acid\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:40:52,983 : INFO : topic diff=0.007626, rho=0.037088\n", + "2019-01-31 00:40:53,138 : INFO : PROGRESS: pass 0, at document #1456000/4922894\n", + "2019-01-31 00:40:54,516 : INFO : merging changes from 2000 documents 
into a model of 4922894 documents\n", + "2019-01-31 00:40:54,783 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.019*\"gener\" + 0.018*\"serv\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:54,784 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"candid\"\n", + "2019-01-31 00:40:54,785 : INFO : topic #15 (0.020): 0.012*\"organ\" + 0.011*\"small\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:40:54,786 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.009*\"market\" + 0.009*\"bank\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:40:54,787 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.012*\"juan\" + 0.011*\"francisco\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 00:40:54,793 : INFO : topic diff=0.006284, rho=0.037062\n", + "2019-01-31 00:40:54,945 : INFO : PROGRESS: pass 0, at document #1458000/4922894\n", + "2019-01-31 00:40:56,322 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:40:56,588 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.028*\"offic\" + 0.023*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.020*\"serv\" + 0.019*\"member\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:40:56,589 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.015*\"lazi\" + 0.014*\"loui\" + 0.011*\"piec\" + 
0.010*\"wine\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:40:56,591 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"francisco\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 00:40:56,592 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"battalion\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.007*\"till\" + 0.006*\"king\"\n", + "2019-01-31 00:40:56,593 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"vigour\" + 0.043*\"popolo\" + 0.043*\"tortur\" + 0.030*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.023*\"regim\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:40:56,599 : INFO : topic diff=0.006419, rho=0.037037\n", + "2019-01-31 00:40:59,307 : INFO : -11.946 per-word bound, 3946.2 perplexity estimate based on a held-out corpus of 2000 documents with 576624 words\n", + "2019-01-31 00:40:59,308 : INFO : PROGRESS: pass 0, at document #1460000/4922894\n", + "2019-01-31 00:41:00,695 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:00,962 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.025*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.019*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airmen\" + 0.011*\"airbu\"\n", + "2019-01-31 00:41:00,963 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:41:00,964 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.009*\"bank\" + 0.009*\"market\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.008*\"industri\" + 0.007*\"function\"\n", + "2019-01-31 
00:41:00,965 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.043*\"tortur\" + 0.030*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.023*\"regim\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:41:00,966 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.015*\"jewish\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.012*\"der\" + 0.010*\"european\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:41:00,972 : INFO : topic diff=0.006277, rho=0.037012\n", + "2019-01-31 00:41:01,129 : INFO : PROGRESS: pass 0, at document #1462000/4922894\n", + "2019-01-31 00:41:02,526 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:02,792 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:41:02,793 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:41:02,794 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.015*\"black\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:41:02,795 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"unfortun\" + 0.020*\"moscow\" + 0.019*\"turin\" + 0.017*\"poland\"\n", + "2019-01-31 00:41:02,796 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.065*\"best\" + 0.037*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:41:02,802 : INFO : 
topic diff=0.007196, rho=0.036986\n", + "2019-01-31 00:41:02,955 : INFO : PROGRESS: pass 0, at document #1464000/4922894\n", + "2019-01-31 00:41:04,320 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:04,586 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.024*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"order\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\"\n", + "2019-01-31 00:41:04,587 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"god\" + 0.007*\"like\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:41:04,588 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.015*\"loui\" + 0.015*\"lazi\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:41:04,589 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.016*\"wind\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.014*\"damag\" + 0.012*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:41:04,590 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:41:04,596 : INFO : topic diff=0.006130, rho=0.036961\n", + "2019-01-31 00:41:04,756 : INFO : PROGRESS: pass 0, at document #1466000/4922894\n", + "2019-01-31 00:41:06,137 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:06,403 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.030*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"tajikistan\" + 0.009*\"start\"\n", + "2019-01-31 00:41:06,405 : 
INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.024*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:41:06,406 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.018*\"candid\" + 0.017*\"taxpay\" + 0.016*\"godaddi\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"landslid\"\n", + "2019-01-31 00:41:06,407 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"god\" + 0.007*\"like\" + 0.006*\"known\"\n", + "2019-01-31 00:41:06,408 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.010*\"gothic\" + 0.010*\"district\"\n", + "2019-01-31 00:41:06,414 : INFO : topic diff=0.006223, rho=0.036936\n", + "2019-01-31 00:41:06,569 : INFO : PROGRESS: pass 0, at document #1468000/4922894\n", + "2019-01-31 00:41:07,939 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:08,208 : INFO : topic #9 (0.020): 0.080*\"bone\" + 0.041*\"american\" + 0.026*\"valour\" + 0.017*\"dutch\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"player\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 00:41:08,209 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"acid\" + 0.006*\"effect\"\n", + "2019-01-31 00:41:08,210 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"slur\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:41:08,211 : INFO : topic 
#30 (0.020): 0.039*\"cleveland\" + 0.037*\"leagu\" + 0.029*\"place\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:41:08,212 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:41:08,218 : INFO : topic diff=0.006765, rho=0.036911\n", + "2019-01-31 00:41:08,428 : INFO : PROGRESS: pass 0, at document #1470000/4922894\n", + "2019-01-31 00:41:09,815 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:10,082 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.020*\"unfortun\" + 0.019*\"turin\" + 0.017*\"poland\"\n", + "2019-01-31 00:41:10,083 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"sweden\" + 0.017*\"swedish\" + 0.016*\"wind\" + 0.015*\"damag\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.012*\"huntsvil\" + 0.012*\"treeless\" + 0.011*\"farid\"\n", + "2019-01-31 00:41:10,084 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:41:10,086 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"slur\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:41:10,087 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 
0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:41:10,092 : INFO : topic diff=0.005940, rho=0.036886\n", + "2019-01-31 00:41:10,248 : INFO : PROGRESS: pass 0, at document #1472000/4922894\n", + "2019-01-31 00:41:11,659 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:11,926 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.013*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:41:11,927 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:41:11,928 : INFO : topic #14 (0.020): 0.026*\"forc\" + 0.025*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:41:11,929 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.021*\"moscow\" + 0.020*\"unfortun\" + 0.018*\"turin\" + 0.017*\"poland\"\n", + "2019-01-31 00:41:11,930 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.017*\"jewish\" + 0.014*\"israel\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.012*\"der\" + 0.010*\"european\" + 0.010*\"jeremiah\" + 0.009*\"europ\"\n", + "2019-01-31 00:41:11,936 : INFO : topic diff=0.005696, rho=0.036860\n", + "2019-01-31 00:41:12,087 : INFO : PROGRESS: pass 0, at document #1474000/4922894\n", + "2019-01-31 00:41:13,439 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:13,706 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 
0.010*\"task\" + 0.009*\"district\" + 0.009*\"gothic\"\n", + "2019-01-31 00:41:13,707 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.027*\"son\" + 0.027*\"reconstruct\" + 0.027*\"rel\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:41:13,708 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"championship\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"base\" + 0.007*\"diggin\"\n", + "2019-01-31 00:41:13,709 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.029*\"offic\" + 0.022*\"minist\" + 0.021*\"nation\" + 0.020*\"serv\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:41:13,710 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.009*\"market\" + 0.009*\"bank\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:41:13,716 : INFO : topic diff=0.006173, rho=0.036835\n", + "2019-01-31 00:41:13,876 : INFO : PROGRESS: pass 0, at document #1476000/4922894\n", + "2019-01-31 00:41:15,302 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:15,567 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:41:15,568 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.038*\"canadian\" + 0.021*\"toronto\" + 0.019*\"ontario\" + 0.019*\"hoar\" + 0.014*\"new\" + 0.012*\"hydrogen\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:41:15,570 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 
0.010*\"order\" + 0.009*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\"\n", + "2019-01-31 00:41:15,571 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.022*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:41:15,572 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.034*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"damn\" + 0.017*\"compos\" + 0.014*\"physician\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.011*\"jack\"\n", + "2019-01-31 00:41:15,578 : INFO : topic diff=0.007005, rho=0.036811\n", + "2019-01-31 00:41:15,738 : INFO : PROGRESS: pass 0, at document #1478000/4922894\n", + "2019-01-31 00:41:17,121 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:17,391 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.028*\"offic\" + 0.022*\"minist\" + 0.022*\"nation\" + 0.020*\"member\" + 0.020*\"govern\" + 0.020*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:41:17,392 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:41:17,393 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"gothic\" + 0.009*\"district\"\n", + "2019-01-31 00:41:17,394 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.015*\"black\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:41:17,395 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.009*\"man\" + 0.007*\"gestur\" + 0.006*\"septemb\" + 0.006*\"charact\" + 0.005*\"dixi\" + 0.005*\"comic\" 
+ 0.005*\"blue\" + 0.004*\"appear\" + 0.004*\"black\"\n", + "2019-01-31 00:41:17,401 : INFO : topic diff=0.006131, rho=0.036786\n", + "2019-01-31 00:41:20,102 : INFO : -11.685 per-word bound, 3292.0 perplexity estimate based on a held-out corpus of 2000 documents with 552756 words\n", + "2019-01-31 00:41:20,103 : INFO : PROGRESS: pass 0, at document #1480000/4922894\n", + "2019-01-31 00:41:21,495 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:21,762 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"militari\" + 0.006*\"till\" + 0.006*\"pour\"\n", + "2019-01-31 00:41:21,763 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 00:41:21,764 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.049*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.016*\"lazi\" + 0.015*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:41:21,765 : INFO : topic #49 (0.020): 0.040*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.009*\"start\"\n", + "2019-01-31 00:41:21,766 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.028*\"offic\" + 0.023*\"minist\" + 0.022*\"nation\" + 0.020*\"member\" + 0.020*\"govern\" + 0.020*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.016*\"chickasaw\"\n", + "2019-01-31 00:41:21,772 : INFO : topic diff=0.005522, rho=0.036761\n", + "2019-01-31 00:41:21,934 : INFO : PROGRESS: pass 0, at document #1482000/4922894\n", + "2019-01-31 00:41:23,367 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:23,633 : INFO : 
topic #9 (0.020): 0.079*\"bone\" + 0.041*\"american\" + 0.025*\"valour\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.017*\"folei\" + 0.016*\"player\" + 0.015*\"english\" + 0.013*\"simpler\" + 0.013*\"acrimoni\"\n", + "2019-01-31 00:41:23,634 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.013*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"daughter\"\n", + "2019-01-31 00:41:23,635 : INFO : topic #37 (0.020): 0.009*\"love\" + 0.009*\"man\" + 0.007*\"gestur\" + 0.006*\"septemb\" + 0.006*\"charact\" + 0.005*\"comic\" + 0.005*\"dixi\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"madison\"\n", + "2019-01-31 00:41:23,637 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.014*\"selma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:41:23,638 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.027*\"woman\" + 0.026*\"olymp\" + 0.025*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"nation\" + 0.018*\"taxpay\" + 0.017*\"alic\"\n", + "2019-01-31 00:41:23,644 : INFO : topic diff=0.006173, rho=0.036736\n", + "2019-01-31 00:41:23,801 : INFO : PROGRESS: pass 0, at document #1484000/4922894\n", + "2019-01-31 00:41:25,176 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:25,442 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.006*\"utopian\" + 0.006*\"measur\"\n", + "2019-01-31 00:41:25,443 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 
0.006*\"proper\"\n", + "2019-01-31 00:41:25,444 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.018*\"candid\" + 0.017*\"taxpay\" + 0.014*\"godaddi\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.010*\"poet\"\n", + "2019-01-31 00:41:25,444 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:41:25,446 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.009*\"market\" + 0.009*\"produc\" + 0.009*\"bank\" + 0.008*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:41:25,451 : INFO : topic diff=0.006195, rho=0.036711\n", + "2019-01-31 00:41:25,607 : INFO : PROGRESS: pass 0, at document #1486000/4922894\n", + "2019-01-31 00:41:26,986 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:27,253 : INFO : topic #48 (0.020): 0.076*\"sens\" + 0.075*\"march\" + 0.075*\"octob\" + 0.069*\"juli\" + 0.068*\"januari\" + 0.067*\"april\" + 0.066*\"notion\" + 0.066*\"august\" + 0.065*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 00:41:27,254 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.024*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:41:27,255 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"year\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:41:27,256 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"storag\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 
0.011*\"magazin\"\n", + "2019-01-31 00:41:27,257 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.016*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.008*\"land\"\n", + "2019-01-31 00:41:27,263 : INFO : topic diff=0.006561, rho=0.036686\n", + "2019-01-31 00:41:27,419 : INFO : PROGRESS: pass 0, at document #1488000/4922894\n", + "2019-01-31 00:41:28,809 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:29,075 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.019*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 00:41:29,076 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.012*\"juan\" + 0.011*\"lizard\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 00:41:29,077 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.037*\"canadian\" + 0.021*\"toronto\" + 0.019*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.013*\"hydrogen\" + 0.013*\"novotná\" + 0.012*\"misericordia\" + 0.011*\"quebec\"\n", + "2019-01-31 00:41:29,078 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.006*\"measur\"\n", + "2019-01-31 00:41:29,079 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.028*\"offic\" + 0.023*\"minist\" + 0.022*\"nation\" + 0.020*\"member\" + 0.020*\"govern\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:41:29,085 : INFO : topic diff=0.005363, rho=0.036662\n", + "2019-01-31 00:41:29,237 : INFO : PROGRESS: pass 0, at document #1490000/4922894\n", + "2019-01-31 00:41:30,614 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:30,880 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:41:30,881 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"australian\" + 0.023*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:41:30,882 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.017*\"republ\" + 0.017*\"polici\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:41:30,883 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"vol\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"itali\"\n", + "2019-01-31 00:41:30,884 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:41:30,890 : INFO : topic diff=0.005486, rho=0.036637\n", + "2019-01-31 00:41:31,045 : INFO : PROGRESS: pass 0, at document #1492000/4922894\n", + "2019-01-31 00:41:32,421 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:32,688 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 00:41:32,689 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.029*\"incumb\" + 0.014*\"anglo\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"sri\" + 
0.011*\"muskoge\" + 0.009*\"affection\" + 0.009*\"khalsa\"\n", + "2019-01-31 00:41:32,690 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.024*\"cortic\" + 0.019*\"act\" + 0.019*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.009*\"replac\" + 0.008*\"legal\"\n", + "2019-01-31 00:41:32,691 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.066*\"best\" + 0.036*\"yawn\" + 0.027*\"jacksonvil\" + 0.025*\"japanes\" + 0.024*\"festiv\" + 0.022*\"noll\" + 0.018*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:41:32,692 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.010*\"market\" + 0.009*\"produc\" + 0.009*\"bank\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:41:32,698 : INFO : topic diff=0.005837, rho=0.036613\n", + "2019-01-31 00:41:32,853 : INFO : PROGRESS: pass 0, at document #1494000/4922894\n", + "2019-01-31 00:41:34,235 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:34,502 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.066*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.026*\"japanes\" + 0.024*\"festiv\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:41:34,503 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"pour\" + 0.015*\"depress\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"candid\" + 0.007*\"produc\"\n", + "2019-01-31 00:41:34,503 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.032*\"priest\" + 0.020*\"grammat\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"count\"\n", + "2019-01-31 00:41:34,505 : INFO : topic #15 (0.020): 0.011*\"organ\" + 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 
0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:41:34,506 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:41:34,512 : INFO : topic diff=0.006679, rho=0.036588\n", + "2019-01-31 00:41:34,663 : INFO : PROGRESS: pass 0, at document #1496000/4922894\n", + "2019-01-31 00:41:36,020 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:36,286 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:41:36,287 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.023*\"rivièr\" + 0.016*\"buford\" + 0.012*\"briarwood\" + 0.012*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:41:36,288 : INFO : topic #11 (0.020): 0.026*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:41:36,289 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.019*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"cathedr\" + 0.009*\"relationship\" + 0.009*\"centuri\" + 0.009*\"parish\"\n", + "2019-01-31 00:41:36,290 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.032*\"priest\" + 0.020*\"grammat\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 00:41:36,296 : INFO : topic diff=0.005765, 
rho=0.036564\n", + "2019-01-31 00:41:36,453 : INFO : PROGRESS: pass 0, at document #1498000/4922894\n", + "2019-01-31 00:41:37,850 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:38,116 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.012*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:41:38,117 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 00:41:38,118 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"pour\" + 0.015*\"depress\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"candid\"\n", + "2019-01-31 00:41:38,119 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.009*\"develop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"championship\" + 0.007*\"diggin\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:41:38,120 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:41:38,126 : INFO : topic diff=0.006082, rho=0.036539\n", + "2019-01-31 00:41:40,875 : INFO : -11.689 per-word bound, 3300.9 perplexity estimate based on a held-out corpus of 2000 documents with 582129 words\n", + "2019-01-31 00:41:40,876 : INFO : PROGRESS: pass 0, at document #1500000/4922894\n", + "2019-01-31 00:41:42,286 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:42,552 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 
0.019*\"act\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.009*\"replac\" + 0.008*\"legal\"\n", + "2019-01-31 00:41:42,553 : INFO : topic #30 (0.020): 0.038*\"cleveland\" + 0.037*\"leagu\" + 0.028*\"place\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:41:42,554 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.013*\"blur\" + 0.013*\"scot\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:41:42,555 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.011*\"pop\" + 0.009*\"develop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"championship\" + 0.007*\"uruguayan\" + 0.007*\"diggin\"\n", + "2019-01-31 00:41:42,556 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"like\" + 0.006*\"english\" + 0.006*\"known\"\n", + "2019-01-31 00:41:42,562 : INFO : topic diff=0.005669, rho=0.036515\n", + "2019-01-31 00:41:42,721 : INFO : PROGRESS: pass 0, at document #1502000/4922894\n", + "2019-01-31 00:41:44,127 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:44,393 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:41:44,394 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:41:44,395 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 
0.010*\"market\" + 0.009*\"produc\" + 0.009*\"bank\" + 0.008*\"yawn\" + 0.008*\"industri\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:41:44,397 : INFO : topic #30 (0.020): 0.038*\"cleveland\" + 0.037*\"leagu\" + 0.028*\"place\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:41:44,398 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.016*\"mount\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.008*\"land\"\n", + "2019-01-31 00:41:44,405 : INFO : topic diff=0.006691, rho=0.036491\n", + "2019-01-31 00:41:44,620 : INFO : PROGRESS: pass 0, at document #1504000/4922894\n", + "2019-01-31 00:41:46,054 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:46,320 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.013*\"driver\" + 0.013*\"godaddi\" + 0.012*\"fool\" + 0.011*\"ret\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"squatter\"\n", + "2019-01-31 00:41:46,321 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.021*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.013*\"francisco\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 00:41:46,323 : INFO : topic #48 (0.020): 0.076*\"sens\" + 0.076*\"octob\" + 0.075*\"march\" + 0.070*\"juli\" + 0.068*\"januari\" + 0.067*\"april\" + 0.067*\"notion\" + 0.066*\"august\" + 0.066*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 00:41:46,324 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:41:46,325 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.024*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 
0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:41:46,331 : INFO : topic diff=0.005575, rho=0.036466\n", + "2019-01-31 00:41:46,488 : INFO : PROGRESS: pass 0, at document #1506000/4922894\n", + "2019-01-31 00:41:47,896 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:48,163 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:41:48,164 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"battalion\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"king\"\n", + "2019-01-31 00:41:48,165 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:41:48,167 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.011*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"like\" + 0.006*\"god\" + 0.006*\"known\"\n", + "2019-01-31 00:41:48,168 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.028*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:41:48,174 : INFO : topic diff=0.006276, rho=0.036442\n", + "2019-01-31 00:41:48,332 : INFO : PROGRESS: pass 0, at document #1508000/4922894\n", + "2019-01-31 00:41:49,754 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:50,020 : INFO : topic #31 (0.020): 
0.058*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"player\" + 0.024*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"folei\" + 0.012*\"leagu\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:41:50,022 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:41:50,023 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:41:50,024 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.013*\"driver\" + 0.013*\"godaddi\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"squatter\"\n", + "2019-01-31 00:41:50,025 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.020*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.013*\"santa\" + 0.013*\"francisco\" + 0.013*\"soviet\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 00:41:50,031 : INFO : topic diff=0.005304, rho=0.036418\n", + "2019-01-31 00:41:50,190 : INFO : PROGRESS: pass 0, at document #1510000/4922894\n", + "2019-01-31 00:41:51,602 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:51,869 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:41:51,870 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.031*\"american\" + 0.027*\"new\" + 0.016*\"year\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:41:51,871 : INFO : topic #39 
(0.020): 0.050*\"canada\" + 0.039*\"canadian\" + 0.022*\"hoar\" + 0.021*\"toronto\" + 0.018*\"ontario\" + 0.014*\"hydrogen\" + 0.014*\"new\" + 0.012*\"novotná\" + 0.012*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:41:51,872 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.028*\"incumb\" + 0.013*\"anglo\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"alam\" + 0.010*\"sri\" + 0.010*\"muskoge\" + 0.009*\"affection\"\n", + "2019-01-31 00:41:51,873 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:41:51,879 : INFO : topic diff=0.007031, rho=0.036394\n", + "2019-01-31 00:41:52,034 : INFO : PROGRESS: pass 0, at document #1512000/4922894\n", + "2019-01-31 00:41:53,429 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:53,695 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:41:53,697 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:41:53,698 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:41:53,699 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.027*\"london\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:41:53,700 
: INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.030*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 00:41:53,706 : INFO : topic diff=0.005473, rho=0.036370\n", + "2019-01-31 00:41:53,860 : INFO : PROGRESS: pass 0, at document #1514000/4922894\n", + "2019-01-31 00:41:55,240 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:55,506 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.041*\"tortur\" + 0.030*\"cotton\" + 0.028*\"area\" + 0.024*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:41:55,507 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.042*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.023*\"korea\" + 0.022*\"korean\" + 0.018*\"sourc\" + 0.016*\"leah\" + 0.014*\"kim\" + 0.014*\"articul\"\n", + "2019-01-31 00:41:55,508 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.009*\"cathedr\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 00:41:55,509 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.031*\"american\" + 0.027*\"new\" + 0.016*\"year\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:41:55,510 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.019*\"taxpay\" + 0.017*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"godaddi\" + 0.011*\"tornado\" + 0.011*\"find\" + 0.010*\"landslid\"\n", + "2019-01-31 00:41:55,516 : INFO : topic diff=0.005304, rho=0.036346\n", + "2019-01-31 00:41:55,672 : INFO : PROGRESS: pass 0, at document #1516000/4922894\n", + "2019-01-31 00:41:57,073 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:41:57,339 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.005*\"differ\"\n", + "2019-01-31 00:41:57,341 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"reprint\" + 0.025*\"personifi\" + 0.023*\"poison\" + 0.021*\"moscow\" + 0.019*\"unfortun\" + 0.016*\"poland\" + 0.015*\"turin\"\n", + "2019-01-31 00:41:57,342 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:41:57,343 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.039*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.014*\"hydrogen\" + 0.013*\"novotná\" + 0.012*\"misericordia\" + 0.011*\"quebec\"\n", + "2019-01-31 00:41:57,344 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:41:57,349 : INFO : topic diff=0.006034, rho=0.036322\n", + "2019-01-31 00:41:57,505 : INFO : PROGRESS: pass 0, at document #1518000/4922894\n", + "2019-01-31 00:41:58,899 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:41:59,165 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"warmth\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.008*\"vacant\" + 0.008*\"north\" + 0.008*\"lobe\"\n", + "2019-01-31 00:41:59,167 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.019*\"taxpay\" + 0.017*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"godaddi\" + 0.012*\"fool\" + 0.011*\"tornado\" + 0.011*\"find\" + 
0.010*\"squatter\"\n", + "2019-01-31 00:41:59,168 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"nation\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 00:41:59,169 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.006*\"charact\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.005*\"dixi\" + 0.004*\"admit\"\n", + "2019-01-31 00:41:59,170 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.009*\"cytokin\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"championship\" + 0.007*\"diggin\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:41:59,176 : INFO : topic diff=0.005246, rho=0.036298\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:42:01,852 : INFO : -11.877 per-word bound, 3762.5 perplexity estimate based on a held-out corpus of 2000 documents with 535638 words\n", + "2019-01-31 00:42:01,852 : INFO : PROGRESS: pass 0, at document #1520000/4922894\n", + "2019-01-31 00:42:03,233 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:03,500 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"olympo\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 00:42:03,501 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:42:03,502 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"personifi\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.021*\"moscow\" + 0.019*\"unfortun\" + 0.016*\"poland\" + 
0.014*\"turin\"\n", + "2019-01-31 00:42:03,503 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"life\" + 0.014*\"bone\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"daughter\"\n", + "2019-01-31 00:42:03,505 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.021*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"centuri\"\n", + "2019-01-31 00:42:03,510 : INFO : topic diff=0.004966, rho=0.036274\n", + "2019-01-31 00:42:03,670 : INFO : PROGRESS: pass 0, at document #1522000/4922894\n", + "2019-01-31 00:42:05,434 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:05,702 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:42:05,703 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.039*\"canadian\" + 0.021*\"toronto\" + 0.021*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.014*\"hydrogen\" + 0.013*\"misericordia\" + 0.013*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 00:42:05,704 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.043*\"american\" + 0.025*\"valour\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"folei\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 00:42:05,705 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.015*\"black\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"depress\"\n", + "2019-01-31 00:42:05,706 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.004*\"end\" + 0.004*\"like\" + 0.004*\"man\" + 
0.004*\"call\"\n", + "2019-01-31 00:42:05,712 : INFO : topic diff=0.005709, rho=0.036250\n", + "2019-01-31 00:42:05,870 : INFO : PROGRESS: pass 0, at document #1524000/4922894\n", + "2019-01-31 00:42:07,731 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:07,999 : INFO : topic #39 (0.020): 0.050*\"canada\" + 0.039*\"canadian\" + 0.021*\"toronto\" + 0.021*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.014*\"hydrogen\" + 0.013*\"misericordia\" + 0.012*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 00:42:08,000 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 00:42:08,001 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.043*\"american\" + 0.025*\"valour\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"folei\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 00:42:08,002 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:42:08,003 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.037*\"leagu\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:42:08,009 : INFO : topic diff=0.006597, rho=0.036226\n", + "2019-01-31 00:42:08,170 : INFO : PROGRESS: pass 0, at document #1526000/4922894\n", + "2019-01-31 00:42:09,648 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:09,915 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.013*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 
0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:42:09,916 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:09,917 : INFO : topic #16 (0.020): 0.048*\"king\" + 0.030*\"priest\" + 0.019*\"grammat\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.018*\"duke\" + 0.015*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"maria\"\n", + "2019-01-31 00:42:09,918 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.021*\"sail\" + 0.021*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:42:09,919 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"godaddi\" + 0.010*\"squatter\"\n", + "2019-01-31 00:42:09,925 : INFO : topic diff=0.006089, rho=0.036202\n", + "2019-01-31 00:42:10,079 : INFO : PROGRESS: pass 0, at document #1528000/4922894\n", + "2019-01-31 00:42:11,456 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:11,723 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.026*\"valour\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"folei\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 00:42:11,724 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.029*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.017*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.012*\"winner\"\n", + "2019-01-31 00:42:11,725 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.022*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 
0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:11,726 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"man\" + 0.004*\"call\"\n", + "2019-01-31 00:42:11,727 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:42:11,733 : INFO : topic diff=0.006765, rho=0.036179\n", + "2019-01-31 00:42:11,891 : INFO : PROGRESS: pass 0, at document #1530000/4922894\n", + "2019-01-31 00:42:13,296 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:13,563 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.037*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:42:13,564 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.029*\"cotton\" + 0.028*\"area\" + 0.024*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:42:13,565 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"swedish\" + 0.018*\"sweden\" + 0.017*\"norwai\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"huntsvil\" + 0.011*\"farid\" + 0.011*\"denmark\"\n", + "2019-01-31 00:42:13,566 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.021*\"sail\" + 0.021*\"jean\" + 0.019*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.010*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:42:13,567 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 
0.006*\"woman\"\n", + "2019-01-31 00:42:13,573 : INFO : topic diff=0.005706, rho=0.036155\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:42:13,731 : INFO : PROGRESS: pass 0, at document #1532000/4922894\n", + "2019-01-31 00:42:15,138 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:15,404 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.037*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.011*\"schmitz\"\n", + "2019-01-31 00:42:15,405 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.013*\"report\" + 0.013*\"seaport\" + 0.013*\"bypass\"\n", + "2019-01-31 00:42:15,406 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"charact\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"dixi\" + 0.004*\"admit\"\n", + "2019-01-31 00:42:15,407 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"like\" + 0.007*\"english\" + 0.007*\"known\"\n", + "2019-01-31 00:42:15,408 : INFO : topic #39 (0.020): 0.049*\"canada\" + 0.038*\"canadian\" + 0.021*\"hoar\" + 0.021*\"ontario\" + 0.021*\"toronto\" + 0.014*\"new\" + 0.013*\"hydrogen\" + 0.013*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:42:15,414 : INFO : topic diff=0.005029, rho=0.036131\n", + "2019-01-31 00:42:15,628 : INFO : PROGRESS: pass 0, at document #1534000/4922894\n", + "2019-01-31 00:42:17,029 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:17,295 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.031*\"american\" + 0.030*\"cotton\" 
+ 0.027*\"new\" + 0.016*\"year\" + 0.014*\"california\" + 0.012*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:42:17,296 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.069*\"best\" + 0.036*\"yawn\" + 0.027*\"jacksonvil\" + 0.024*\"japanes\" + 0.024*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:42:17,297 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.024*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.007*\"light\" + 0.007*\"depress\"\n", + "2019-01-31 00:42:17,298 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.037*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:42:17,299 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.019*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:42:17,305 : INFO : topic diff=0.005688, rho=0.036108\n", + "2019-01-31 00:42:17,460 : INFO : PROGRESS: pass 0, at document #1536000/4922894\n", + "2019-01-31 00:42:18,844 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:19,111 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.014*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"will\"\n", + "2019-01-31 00:42:19,112 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.006*\"charact\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"dixi\" + 0.004*\"admit\"\n", + "2019-01-31 00:42:19,113 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 
0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"man\"\n", + "2019-01-31 00:42:19,114 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:42:19,115 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.024*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:42:19,121 : INFO : topic diff=0.004895, rho=0.036084\n", + "2019-01-31 00:42:19,277 : INFO : PROGRESS: pass 0, at document #1538000/4922894\n", + "2019-01-31 00:42:20,672 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:20,938 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.040*\"american\" + 0.026*\"valour\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"folei\" + 0.016*\"player\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:42:20,940 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.022*\"serv\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.020*\"member\" + 0.019*\"gener\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:42:20,941 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:42:20,942 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"itali\"\n", + "2019-01-31 00:42:20,943 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"taxpay\" + 0.017*\"candid\" + 0.015*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 
0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 00:42:20,949 : INFO : topic diff=0.005520, rho=0.036061\n", + "2019-01-31 00:42:23,608 : INFO : -11.625 per-word bound, 3157.7 perplexity estimate based on a held-out corpus of 2000 documents with 517770 words\n", + "2019-01-31 00:42:23,609 : INFO : PROGRESS: pass 0, at document #1540000/4922894\n", + "2019-01-31 00:42:24,992 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:25,258 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.012*\"winner\"\n", + "2019-01-31 00:42:25,259 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:42:25,261 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.020*\"christian\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"parish\"\n", + "2019-01-31 00:42:25,262 : INFO : topic #29 (0.020): 0.026*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.010*\"bank\" + 0.010*\"market\" + 0.009*\"produc\" + 0.008*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:42:25,263 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"reprint\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.019*\"unfortun\" + 0.016*\"poland\" + 0.015*\"czech\"\n", + "2019-01-31 00:42:25,268 : INFO : topic diff=0.005680, rho=0.036037\n", + "2019-01-31 00:42:25,425 : INFO : PROGRESS: pass 0, at document #1542000/4922894\n", + "2019-01-31 00:42:26,804 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 00:42:27,071 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.023*\"medal\" + 0.023*\"men\" + 0.021*\"event\" + 0.019*\"nation\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 00:42:27,072 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.012*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.007*\"diggin\" + 0.007*\"championship\" + 0.007*\"includ\"\n", + "2019-01-31 00:42:27,073 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.039*\"tortur\" + 0.029*\"cotton\" + 0.027*\"area\" + 0.024*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:42:27,074 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"like\" + 0.007*\"known\"\n", + "2019-01-31 00:42:27,075 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.024*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.007*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:42:27,081 : INFO : topic diff=0.005784, rho=0.036014\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:42:27,234 : INFO : PROGRESS: pass 0, at document #1544000/4922894\n", + "2019-01-31 00:42:28,602 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:28,869 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.014*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:42:28,870 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.037*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.026*\"scientist\" + 
0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:42:28,871 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.024*\"poison\" + 0.019*\"moscow\" + 0.019*\"unfortun\" + 0.016*\"poland\" + 0.015*\"czech\"\n", + "2019-01-31 00:42:28,872 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.040*\"line\" + 0.036*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.022*\"traceabl\" + 0.018*\"serv\" + 0.015*\"exhaust\" + 0.014*\"pain\" + 0.012*\"oper\"\n", + "2019-01-31 00:42:28,873 : INFO : topic #29 (0.020): 0.026*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.010*\"market\" + 0.010*\"bank\" + 0.009*\"produc\" + 0.008*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:42:28,879 : INFO : topic diff=0.005157, rho=0.035991\n", + "2019-01-31 00:42:29,037 : INFO : PROGRESS: pass 0, at document #1546000/4922894\n", + "2019-01-31 00:42:30,433 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:30,700 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.070*\"best\" + 0.036*\"yawn\" + 0.027*\"jacksonvil\" + 0.024*\"festiv\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:42:30,701 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:30,702 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.007*\"encyclopedia\" + 0.006*\"produc\"\n", + "2019-01-31 00:42:30,703 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 
0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:42:30,704 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.039*\"line\" + 0.036*\"arsen\" + 0.035*\"raid\" + 0.028*\"museo\" + 0.022*\"traceabl\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:42:30,710 : INFO : topic diff=0.005858, rho=0.035968\n", + "2019-01-31 00:42:30,868 : INFO : PROGRESS: pass 0, at document #1548000/4922894\n", + "2019-01-31 00:42:32,263 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:32,529 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:42:32,531 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.012*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"championship\" + 0.008*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 00:42:32,532 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"serv\" + 0.021*\"nation\" + 0.020*\"member\" + 0.019*\"govern\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:42:32,533 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"year\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:42:32,534 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.024*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"black\" + 0.016*\"colder\" + 0.015*\"western\" + 0.013*\"record\" + 0.010*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n", + "2019-01-31 00:42:32,540 : INFO : topic diff=0.005734, rho=0.035944\n", + "2019-01-31 00:42:32,694 : INFO : PROGRESS: pass 0, at document #1550000/4922894\n", + 
"2019-01-31 00:42:34,063 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:34,329 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:42:34,330 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:42:34,332 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:42:34,332 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.018*\"swedish\" + 0.018*\"sweden\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.012*\"huntsvil\" + 0.010*\"farid\" + 0.010*\"denmark\"\n", + "2019-01-31 00:42:34,334 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"man\" + 0.004*\"call\"\n", + "2019-01-31 00:42:34,339 : INFO : topic diff=0.006208, rho=0.035921\n", + "2019-01-31 00:42:34,494 : INFO : PROGRESS: pass 0, at document #1552000/4922894\n", + "2019-01-31 00:42:35,870 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:36,137 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:42:36,138 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 
0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:42:36,139 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.039*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"folei\" + 0.016*\"player\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:42:36,140 : INFO : topic #24 (0.020): 0.042*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:42:36,141 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.015*\"olympo\" + 0.013*\"physician\" + 0.013*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 00:42:36,147 : INFO : topic diff=0.006295, rho=0.035898\n", + "2019-01-31 00:42:36,313 : INFO : PROGRESS: pass 0, at document #1554000/4922894\n", + "2019-01-31 00:42:37,707 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:37,973 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.070*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.025*\"japanes\" + 0.024*\"festiv\" + 0.020*\"noll\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:42:37,974 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"europ\" + 0.009*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 00:42:37,976 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.006*\"differ\"\n", + "2019-01-31 00:42:37,977 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 
0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:42:37,978 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"north\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 00:42:37,984 : INFO : topic diff=0.005194, rho=0.035875\n", + "2019-01-31 00:42:38,141 : INFO : PROGRESS: pass 0, at document #1556000/4922894\n", + "2019-01-31 00:42:39,550 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:39,815 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.070*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.024*\"festiv\" + 0.020*\"noll\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:42:39,816 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.026*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:42:39,817 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:39,818 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"hormon\" + 0.006*\"dress\" + 0.006*\"effect\"\n", + "2019-01-31 00:42:39,819 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.006*\"woman\"\n", + "2019-01-31 00:42:39,825 : INFO : topic diff=0.006061, rho=0.035852\n", + "2019-01-31 00:42:39,980 : INFO : PROGRESS: pass 0, at document 
#1558000/4922894\n", + "2019-01-31 00:42:41,368 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:41,635 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:42:41,636 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"farid\" + 0.010*\"treeless\"\n", + "2019-01-31 00:42:41,637 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.022*\"serv\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:42:41,638 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"crew\" + 0.009*\"sai\"\n", + "2019-01-31 00:42:41,639 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:42:41,645 : INFO : topic diff=0.005323, rho=0.035829\n", + "2019-01-31 00:42:44,356 : INFO : -11.668 per-word bound, 3254.0 perplexity estimate based on a held-out corpus of 2000 documents with 566242 words\n", + "2019-01-31 00:42:44,357 : INFO : PROGRESS: pass 0, at document #1560000/4922894\n", + "2019-01-31 00:42:45,747 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:46,014 : INFO : topic #31 (0.020): 0.057*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 
0.009*\"yard\"\n", + "2019-01-31 00:42:46,015 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"europ\" + 0.009*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 00:42:46,017 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.006*\"differ\"\n", + "2019-01-31 00:42:46,018 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.024*\"cortic\" + 0.022*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.009*\"polaris\" + 0.008*\"replac\" + 0.008*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 00:42:46,019 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.039*\"line\" + 0.036*\"arsen\" + 0.034*\"raid\" + 0.030*\"museo\" + 0.022*\"traceabl\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"oper\"\n", + "2019-01-31 00:42:46,024 : INFO : topic diff=0.004552, rho=0.035806\n", + "2019-01-31 00:42:46,185 : INFO : PROGRESS: pass 0, at document #1562000/4922894\n", + "2019-01-31 00:42:47,614 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:47,880 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.013*\"articul\"\n", + "2019-01-31 00:42:47,881 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.069*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.020*\"noll\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:42:47,882 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:42:47,883 
: INFO : topic #35 (0.020): 0.056*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.024*\"personifi\" + 0.020*\"unfortun\" + 0.019*\"moscow\" + 0.016*\"poland\" + 0.014*\"czech\"\n", + "2019-01-31 00:42:47,884 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.012*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"championship\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 00:42:47,890 : INFO : topic diff=0.005663, rho=0.035783\n", + "2019-01-31 00:42:48,046 : INFO : PROGRESS: pass 0, at document #1564000/4922894\n", + "2019-01-31 00:42:49,439 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:49,705 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"land\" + 0.008*\"sourc\"\n", + "2019-01-31 00:42:49,706 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.011*\"sri\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"iran\"\n", + "2019-01-31 00:42:49,707 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"francisco\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n", + "2019-01-31 00:42:49,708 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.040*\"tortur\" + 0.038*\"cotton\" + 0.027*\"area\" + 0.023*\"regim\" + 0.023*\"citi\" + 0.023*\"multitud\" + 0.019*\"cede\"\n", + "2019-01-31 00:42:49,709 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"market\" + 0.010*\"bank\" + 0.009*\"produc\" + 0.008*\"industri\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:42:49,715 : 
INFO : topic diff=0.005417, rho=0.035760\n", + "2019-01-31 00:42:49,927 : INFO : PROGRESS: pass 0, at document #1566000/4922894\n", + "2019-01-31 00:42:51,307 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:51,573 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.014*\"olympo\" + 0.013*\"physician\" + 0.012*\"orchestr\" + 0.012*\"jack\"\n", + "2019-01-31 00:42:51,574 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:42:51,575 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.011*\"sri\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 00:42:51,576 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.032*\"american\" + 0.032*\"unionist\" + 0.029*\"cotton\" + 0.028*\"new\" + 0.017*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:42:51,577 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.007*\"charact\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"dixi\" + 0.004*\"black\"\n", + "2019-01-31 00:42:51,583 : INFO : topic diff=0.004586, rho=0.035737\n", + "2019-01-31 00:42:51,741 : INFO : PROGRESS: pass 0, at document #1568000/4922894\n", + "2019-01-31 00:42:53,157 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:53,423 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.016*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 
00:42:53,424 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:42:53,425 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.042*\"popolo\" + 0.040*\"tortur\" + 0.039*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.023*\"regim\" + 0.023*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:42:53,426 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.023*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"liber\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:42:53,427 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:53,433 : INFO : topic diff=0.006657, rho=0.035714\n", + "2019-01-31 00:42:53,587 : INFO : PROGRESS: pass 0, at document #1570000/4922894\n", + "2019-01-31 00:42:54,960 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:55,226 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"sourc\"\n", + "2019-01-31 00:42:55,227 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:42:55,228 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.040*\"tortur\" + 0.038*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.023*\"regim\" + 
0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:42:55,229 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:55,230 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.010*\"market\" + 0.009*\"bank\" + 0.009*\"produc\" + 0.008*\"industri\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:42:55,236 : INFO : topic diff=0.005161, rho=0.035692\n", + "2019-01-31 00:42:55,394 : INFO : PROGRESS: pass 0, at document #1572000/4922894\n", + "2019-01-31 00:42:56,797 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:57,064 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.048*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.013*\"articul\"\n", + "2019-01-31 00:42:57,065 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"hormon\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:42:57,066 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:42:57,067 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"woman\" + 0.028*\"champion\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"taxpay\" + 0.018*\"nation\" + 0.018*\"atheist\"\n", + "2019-01-31 00:42:57,068 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.021*\"serv\" + 0.020*\"govern\" + 0.020*\"member\" + 0.018*\"gener\" + 0.015*\"seri\" + 
0.015*\"start\"\n", + "2019-01-31 00:42:57,074 : INFO : topic diff=0.005756, rho=0.035669\n", + "2019-01-31 00:42:57,228 : INFO : PROGRESS: pass 0, at document #1574000/4922894\n", + "2019-01-31 00:42:58,597 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:42:58,863 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.023*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.013*\"liber\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 00:42:58,864 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.028*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"year\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:42:58,865 : INFO : topic #2 (0.020): 0.045*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"sai\"\n", + "2019-01-31 00:42:58,866 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.024*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:42:58,868 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:42:58,873 : INFO : topic diff=0.007868, rho=0.035646\n", + "2019-01-31 00:42:59,031 : INFO : PROGRESS: pass 0, at document #1576000/4922894\n", + "2019-01-31 00:43:00,428 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:00,694 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.011*\"airbu\" + 
0.011*\"diversifi\"\n", + "2019-01-31 00:43:00,695 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.024*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"black\" + 0.016*\"western\" + 0.015*\"colder\" + 0.014*\"record\" + 0.010*\"blind\" + 0.008*\"green\" + 0.007*\"depress\"\n", + "2019-01-31 00:43:00,696 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.021*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"will\"\n", + "2019-01-31 00:43:00,697 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.019*\"unfortun\" + 0.016*\"poland\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:43:00,698 : INFO : topic #39 (0.020): 0.049*\"canada\" + 0.038*\"canadian\" + 0.021*\"hoar\" + 0.021*\"toronto\" + 0.020*\"ontario\" + 0.014*\"new\" + 0.014*\"quebec\" + 0.014*\"hydrogen\" + 0.013*\"misericordia\" + 0.011*\"novotná\"\n", + "2019-01-31 00:43:00,704 : INFO : topic diff=0.006180, rho=0.035624\n", + "2019-01-31 00:43:00,862 : INFO : PROGRESS: pass 0, at document #1578000/4922894\n", + "2019-01-31 00:43:02,272 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:02,538 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:43:02,539 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:43:02,540 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.016*\"wind\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 
0.012*\"treeless\" + 0.010*\"farid\"\n", + "2019-01-31 00:43:02,541 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"sai\"\n", + "2019-01-31 00:43:02,542 : INFO : topic #29 (0.020): 0.024*\"companhia\" + 0.011*\"million\" + 0.010*\"busi\" + 0.009*\"produc\" + 0.009*\"market\" + 0.009*\"bank\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:43:02,548 : INFO : topic diff=0.005579, rho=0.035601\n", + "2019-01-31 00:43:05,272 : INFO : -11.703 per-word bound, 3333.7 perplexity estimate based on a held-out corpus of 2000 documents with 559860 words\n", + "2019-01-31 00:43:05,273 : INFO : PROGRESS: pass 0, at document #1580000/4922894\n", + "2019-01-31 00:43:06,683 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:06,949 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.019*\"champion\" + 0.019*\"tourist\" + 0.017*\"chamber\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"open\" + 0.013*\"tiepolo\"\n", + "2019-01-31 00:43:06,950 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:43:06,951 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.026*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:43:06,953 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"man\" + 0.004*\"call\"\n", + 
"2019-01-31 00:43:06,954 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 00:43:06,960 : INFO : topic diff=0.005444, rho=0.035578\n", + "2019-01-31 00:43:07,118 : INFO : PROGRESS: pass 0, at document #1582000/4922894\n", + "2019-01-31 00:43:08,532 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:08,799 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.009*\"north\" + 0.008*\"palmer\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:43:08,800 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.032*\"priest\" + 0.020*\"grammat\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.013*\"kingdom\" + 0.013*\"maria\" + 0.012*\"portugues\"\n", + "2019-01-31 00:43:08,801 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.032*\"unionist\" + 0.032*\"american\" + 0.028*\"cotton\" + 0.028*\"new\" + 0.017*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:43:08,802 : INFO : topic #48 (0.020): 0.078*\"octob\" + 0.078*\"sens\" + 0.073*\"march\" + 0.068*\"juli\" + 0.067*\"august\" + 0.067*\"januari\" + 0.066*\"april\" + 0.066*\"notion\" + 0.063*\"judici\" + 0.061*\"decatur\"\n", + "2019-01-31 00:43:08,803 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"man\" + 0.004*\"call\"\n", + "2019-01-31 00:43:08,809 : INFO : topic diff=0.005779, rho=0.035556\n", + "2019-01-31 00:43:08,972 : INFO : PROGRESS: pass 0, at document #1584000/4922894\n", + "2019-01-31 00:43:10,419 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:43:10,685 : INFO : topic #8 (0.020): 0.027*\"act\" + 0.026*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.008*\"replac\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:43:10,686 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"ret\" + 0.017*\"candid\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 00:43:10,687 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.033*\"priest\" + 0.020*\"grammat\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.013*\"kingdom\" + 0.013*\"maria\" + 0.012*\"portugues\"\n", + "2019-01-31 00:43:10,688 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:43:10,689 : INFO : topic #34 (0.020): 0.074*\"start\" + 0.032*\"unionist\" + 0.031*\"american\" + 0.028*\"new\" + 0.028*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:43:10,695 : INFO : topic diff=0.006703, rho=0.035533\n", + "2019-01-31 00:43:10,856 : INFO : PROGRESS: pass 0, at document #1586000/4922894\n", + "2019-01-31 00:43:12,276 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:12,543 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:43:12,544 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.025*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.011*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 
0.010*\"ruler\"\n", + "2019-01-31 00:43:12,545 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.007*\"charact\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"black\" + 0.004*\"dixi\"\n", + "2019-01-31 00:43:12,546 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.040*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.021*\"unfortun\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"malaysia\"\n", + "2019-01-31 00:43:12,547 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.009*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:43:12,552 : INFO : topic diff=0.006777, rho=0.035511\n", + "2019-01-31 00:43:12,710 : INFO : PROGRESS: pass 0, at document #1588000/4922894\n", + "2019-01-31 00:43:14,106 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:14,372 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.019*\"champion\" + 0.019*\"tourist\" + 0.016*\"chamber\" + 0.016*\"taxpay\" + 0.014*\"martin\" + 0.014*\"open\" + 0.013*\"tiepolo\"\n", + "2019-01-31 00:43:14,373 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:43:14,374 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:43:14,376 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"gestur\" + 0.007*\"charact\" + 0.006*\"septemb\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"black\" + 
0.004*\"dixi\"\n", + "2019-01-31 00:43:14,377 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:43:14,382 : INFO : topic diff=0.005561, rho=0.035489\n", + "2019-01-31 00:43:14,534 : INFO : PROGRESS: pass 0, at document #1590000/4922894\n", + "2019-01-31 00:43:15,886 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:16,153 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.021*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:43:16,154 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.014*\"vol\" + 0.014*\"israel\" + 0.013*\"berlin\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 00:43:16,155 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.019*\"champion\" + 0.016*\"chamber\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"open\" + 0.013*\"tiepolo\"\n", + "2019-01-31 00:43:16,156 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.017*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"squatter\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 00:43:16,157 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.040*\"line\" + 0.036*\"arsen\" + 0.035*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.013*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:43:16,163 : INFO : topic diff=0.005877, rho=0.035466\n", + "2019-01-31 00:43:16,315 : INFO : PROGRESS: pass 0, at document #1592000/4922894\n", + "2019-01-31 00:43:17,692 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 00:43:17,958 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.019*\"champion\" + 0.019*\"tourist\" + 0.018*\"chamber\" + 0.016*\"open\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:43:17,959 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.021*\"christian\" + 0.021*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"relationship\"\n", + "2019-01-31 00:43:17,960 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.018*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.015*\"damag\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.012*\"treeless\" + 0.012*\"denmark\"\n", + "2019-01-31 00:43:17,961 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.040*\"american\" + 0.026*\"valour\" + 0.019*\"polit\" + 0.018*\"folei\" + 0.017*\"dutch\" + 0.017*\"player\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:43:17,962 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 00:43:17,968 : INFO : topic diff=0.006631, rho=0.035444\n", + "2019-01-31 00:43:18,122 : INFO : PROGRESS: pass 0, at document #1594000/4922894\n", + "2019-01-31 00:43:19,494 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:19,761 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.023*\"voluntari\" + 0.021*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"selma\" + 0.013*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:43:19,762 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 
0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.007*\"develop\" + 0.007*\"produc\"\n", + "2019-01-31 00:43:19,763 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.038*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.014*\"hydrogen\" + 0.014*\"new\" + 0.014*\"quebec\" + 0.014*\"misericordia\" + 0.012*\"novotná\"\n", + "2019-01-31 00:43:19,764 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:43:19,765 : INFO : topic #45 (0.020): 0.024*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"black\" + 0.017*\"colder\" + 0.016*\"illicit\" + 0.016*\"western\" + 0.014*\"record\" + 0.011*\"blind\" + 0.008*\"green\" + 0.007*\"light\"\n", + "2019-01-31 00:43:19,771 : INFO : topic diff=0.005868, rho=0.035422\n", + "2019-01-31 00:43:19,927 : INFO : PROGRESS: pass 0, at document #1596000/4922894\n", + "2019-01-31 00:43:21,315 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:21,582 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.015*\"damag\" + 0.014*\"norwegian\" + 0.012*\"huntsvil\" + 0.012*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 00:43:21,583 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.040*\"line\" + 0.036*\"arsen\" + 0.035*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:43:21,584 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.011*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:43:21,584 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.048*\"chilton\" + 0.023*\"hong\" + 
0.023*\"kong\" + 0.022*\"korea\" + 0.017*\"korean\" + 0.017*\"sourc\" + 0.014*\"shirin\" + 0.014*\"leah\" + 0.013*\"ashvil\"\n", + "2019-01-31 00:43:21,585 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:43:21,591 : INFO : topic diff=0.006117, rho=0.035400\n", + "2019-01-31 00:43:21,802 : INFO : PROGRESS: pass 0, at document #1598000/4922894\n", + "2019-01-31 00:43:23,205 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:23,471 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"sack\" + 0.007*\"later\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"man\" + 0.004*\"call\"\n", + "2019-01-31 00:43:23,472 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:43:23,473 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.024*\"new\" + 0.024*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:43:23,474 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.042*\"franc\" + 0.028*\"pari\" + 0.021*\"sail\" + 0.020*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.011*\"loui\" + 0.011*\"piec\" + 0.007*\"wine\"\n", + "2019-01-31 00:43:23,475 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.011*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:43:23,481 : INFO : topic diff=0.005936, rho=0.035377\n", + "2019-01-31 00:43:26,203 : INFO : -11.629 per-word bound, 3166.1 
perplexity estimate based on a held-out corpus of 2000 documents with 544776 words\n", + "2019-01-31 00:43:26,203 : INFO : PROGRESS: pass 0, at document #1600000/4922894\n", + "2019-01-31 00:43:27,612 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:27,878 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.042*\"franc\" + 0.028*\"pari\" + 0.021*\"sail\" + 0.020*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.007*\"wine\"\n", + "2019-01-31 00:43:27,879 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:43:27,880 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.019*\"champion\" + 0.018*\"tourist\" + 0.018*\"chamber\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.015*\"open\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:43:27,881 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 00:43:27,882 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.021*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:43:27,888 : INFO : topic diff=0.005878, rho=0.035355\n", + "2019-01-31 00:43:28,044 : INFO : PROGRESS: pass 0, at document #1602000/4922894\n", + "2019-01-31 00:43:29,438 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:29,705 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"minist\" + 0.026*\"offic\" + 0.023*\"serv\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.015*\"seri\" + 
0.015*\"start\"\n", + "2019-01-31 00:43:29,706 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.019*\"quarterli\" + 0.019*\"duke\" + 0.018*\"rotterdam\" + 0.016*\"idiosyncrat\" + 0.013*\"maria\" + 0.012*\"portugues\" + 0.012*\"kingdom\"\n", + "2019-01-31 00:43:29,707 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"man\" + 0.004*\"call\"\n", + "2019-01-31 00:43:29,708 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"selma\" + 0.014*\"republ\" + 0.013*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 00:43:29,709 : INFO : topic #48 (0.020): 0.078*\"octob\" + 0.077*\"sens\" + 0.075*\"march\" + 0.069*\"januari\" + 0.068*\"juli\" + 0.068*\"april\" + 0.068*\"august\" + 0.068*\"notion\" + 0.064*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 00:43:29,715 : INFO : topic diff=0.006346, rho=0.035333\n", + "2019-01-31 00:43:29,872 : INFO : PROGRESS: pass 0, at document #1604000/4922894\n", + "2019-01-31 00:43:31,272 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:31,538 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.009*\"north\" + 0.008*\"palmer\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:43:31,539 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:43:31,540 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"selma\" + 0.014*\"republ\" + 0.013*\"report\" + 0.013*\"bypass\"\n", + 
"2019-01-31 00:43:31,541 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.026*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:43:31,542 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.012*\"prognosi\" + 0.010*\"pop\" + 0.009*\"softwar\" + 0.009*\"develop\" + 0.008*\"championship\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.007*\"diggin\" + 0.007*\"brio\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:43:31,548 : INFO : topic diff=0.006311, rho=0.035311\n", + "2019-01-31 00:43:31,705 : INFO : PROGRESS: pass 0, at document #1606000/4922894\n", + "2019-01-31 00:43:33,107 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:33,373 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.047*\"franc\" + 0.028*\"pari\" + 0.022*\"sail\" + 0.020*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.007*\"wine\"\n", + "2019-01-31 00:43:33,374 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.047*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 00:43:33,375 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.019*\"champion\" + 0.019*\"tourist\" + 0.018*\"chamber\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.015*\"open\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:43:33,376 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:43:33,377 : INFO : topic #2 (0.020): 0.044*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.011*\"blur\" + 0.009*\"bahá\" + 
0.009*\"fleet\"\n", + "2019-01-31 00:43:33,383 : INFO : topic diff=0.006580, rho=0.035289\n", + "2019-01-31 00:43:33,540 : INFO : PROGRESS: pass 0, at document #1608000/4922894\n", + "2019-01-31 00:43:34,941 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:35,208 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:43:35,209 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:43:35,210 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.039*\"line\" + 0.036*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.013*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:43:35,211 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.021*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:43:35,212 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"gestur\" + 0.007*\"charact\" + 0.007*\"comic\" + 0.007*\"septemb\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"black\" + 0.004*\"workplac\"\n", + "2019-01-31 00:43:35,218 : INFO : topic diff=0.005495, rho=0.035267\n", + "2019-01-31 00:43:35,376 : INFO : PROGRESS: pass 0, at document #1610000/4922894\n", + "2019-01-31 00:43:36,768 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:37,035 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.015*\"ret\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.012*\"squatter\" + 
0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 00:43:37,036 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.038*\"american\" + 0.027*\"valour\" + 0.018*\"polit\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:43:37,037 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.038*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.014*\"hydrogen\" + 0.014*\"new\" + 0.013*\"quebec\" + 0.013*\"misericordia\" + 0.012*\"novotná\"\n", + "2019-01-31 00:43:37,038 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:43:37,039 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.013*\"jewish\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 00:43:37,045 : INFO : topic diff=0.006482, rho=0.035245\n", + "2019-01-31 00:43:37,200 : INFO : PROGRESS: pass 0, at document #1612000/4922894\n", + "2019-01-31 00:43:38,586 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:38,852 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 00:43:38,854 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.006*\"socialist\"\n", + "2019-01-31 00:43:38,855 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"seaport\" + 0.014*\"republ\" + 
0.013*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 00:43:38,856 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 00:43:38,857 : INFO : topic #48 (0.020): 0.079*\"octob\" + 0.077*\"sens\" + 0.074*\"march\" + 0.067*\"august\" + 0.067*\"notion\" + 0.067*\"januari\" + 0.067*\"april\" + 0.067*\"juli\" + 0.064*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 00:43:38,863 : INFO : topic diff=0.005898, rho=0.035223\n", + "2019-01-31 00:43:39,017 : INFO : PROGRESS: pass 0, at document #1614000/4922894\n", + "2019-01-31 00:43:40,405 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:40,672 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:43:40,673 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.032*\"priest\" + 0.020*\"quarterli\" + 0.019*\"grammat\" + 0.019*\"duke\" + 0.019*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.013*\"maria\" + 0.013*\"princ\" + 0.012*\"count\"\n", + "2019-01-31 00:43:40,674 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.006*\"socialist\"\n", + "2019-01-31 00:43:40,675 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"seaport\" + 0.014*\"republ\" + 0.013*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 00:43:40,676 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 
0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:43:40,682 : INFO : topic diff=0.005655, rho=0.035202\n", + "2019-01-31 00:43:40,840 : INFO : PROGRESS: pass 0, at document #1616000/4922894\n", + "2019-01-31 00:43:42,246 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:42,513 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.024*\"serv\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.019*\"member\" + 0.018*\"gener\" + 0.015*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:43:42,514 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:43:42,515 : INFO : topic #45 (0.020): 0.024*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"black\" + 0.017*\"western\" + 0.017*\"colder\" + 0.016*\"illicit\" + 0.015*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.008*\"green\"\n", + "2019-01-31 00:43:42,516 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.027*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"festiv\" + 0.021*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:43:42,517 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:43:42,523 : INFO : topic diff=0.004504, rho=0.035180\n", + "2019-01-31 00:43:42,678 : INFO : PROGRESS: pass 0, at document #1618000/4922894\n", + "2019-01-31 00:43:44,059 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:43:44,325 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 
0.026*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.017*\"korean\" + 0.017*\"sourc\" + 0.015*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 00:43:44,326 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.035*\"cotton\" + 0.032*\"unionist\" + 0.030*\"american\" + 0.028*\"new\" + 0.017*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.012*\"north\" + 0.012*\"warrior\"\n", + "2019-01-31 00:43:44,327 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:43:44,328 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.039*\"line\" + 0.037*\"arsen\" + 0.034*\"raid\" + 0.028*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.015*\"exhaust\" + 0.014*\"pain\" + 0.013*\"gai\"\n", + "2019-01-31 00:43:44,329 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:43:44,335 : INFO : topic diff=0.006087, rho=0.035158\n", + "2019-01-31 00:43:47,049 : INFO : -11.657 per-word bound, 3228.5 perplexity estimate based on a held-out corpus of 2000 documents with 564370 words\n", + "2019-01-31 00:43:47,050 : INFO : PROGRESS: pass 0, at document #1620000/4922894\n", + "2019-01-31 00:43:48,425 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:48,691 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.011*\"blur\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:43:48,692 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"seaport\" + 0.013*\"republ\" + 0.013*\"selma\" + 
0.013*\"report\"\n", + "2019-01-31 00:43:48,693 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.012*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\" + 0.009*\"strategist\"\n", + "2019-01-31 00:43:48,694 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.011*\"myspac\"\n", + "2019-01-31 00:43:48,695 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.015*\"wind\" + 0.015*\"norwai\" + 0.015*\"treeless\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.012*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 00:43:48,701 : INFO : topic diff=0.007010, rho=0.035136\n", + "2019-01-31 00:43:48,857 : INFO : PROGRESS: pass 0, at document #1622000/4922894\n", + "2019-01-31 00:43:50,235 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:50,502 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:43:50,503 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.024*\"taxpay\" + 0.020*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"yard\"\n", + "2019-01-31 00:43:50,504 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"woman\" + 0.028*\"champion\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"alic\" + 0.018*\"gold\"\n", + "2019-01-31 00:43:50,505 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 
0.006*\"woman\"\n", + "2019-01-31 00:43:50,506 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:43:50,512 : INFO : topic diff=0.005434, rho=0.035115\n", + "2019-01-31 00:43:50,672 : INFO : PROGRESS: pass 0, at document #1624000/4922894\n", + "2019-01-31 00:43:52,083 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:52,349 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:43:52,350 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.046*\"franc\" + 0.027*\"pari\" + 0.022*\"sail\" + 0.020*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.011*\"loui\" + 0.011*\"piec\" + 0.008*\"convei\"\n", + "2019-01-31 00:43:52,351 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.032*\"priest\" + 0.019*\"quarterli\" + 0.019*\"grammat\" + 0.018*\"duke\" + 0.018*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.013*\"princ\" + 0.013*\"maria\" + 0.012*\"count\"\n", + "2019-01-31 00:43:52,352 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.037*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.019*\"ontario\" + 0.014*\"hydrogen\" + 0.014*\"new\" + 0.013*\"misericordia\" + 0.013*\"quebec\" + 0.012*\"novotná\"\n", + "2019-01-31 00:43:52,353 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.021*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"romanc\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:43:52,359 : INFO : topic diff=0.006906, rho=0.035093\n", + "2019-01-31 00:43:52,523 : INFO : PROGRESS: pass 0, at document #1626000/4922894\n", + "2019-01-31 00:43:53,968 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 00:43:54,234 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:43:54,236 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.006*\"woman\"\n", + "2019-01-31 00:43:54,236 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:43:54,237 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"seaport\" + 0.013*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 00:43:54,238 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.009*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:43:54,244 : INFO : topic diff=0.005354, rho=0.035072\n", + "2019-01-31 00:43:54,401 : INFO : PROGRESS: pass 0, at document #1628000/4922894\n", + "2019-01-31 00:43:55,790 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:56,057 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"champion\" + 0.019*\"tourist\" + 0.018*\"chamber\" + 0.016*\"winner\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.015*\"open\"\n", + "2019-01-31 00:43:56,059 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.027*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 
0.010*\"year\" + 0.009*\"dai\"\n", + "2019-01-31 00:43:56,060 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.037*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.019*\"ontario\" + 0.014*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"new\" + 0.013*\"quebec\" + 0.012*\"novotná\"\n", + "2019-01-31 00:43:56,061 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.011*\"myspac\"\n", + "2019-01-31 00:43:56,063 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:43:56,069 : INFO : topic diff=0.006475, rho=0.035050\n", + "2019-01-31 00:43:56,228 : INFO : PROGRESS: pass 0, at document #1630000/4922894\n", + "2019-01-31 00:43:57,635 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:57,902 : INFO : topic #45 (0.020): 0.025*\"jpg\" + 0.023*\"fifteenth\" + 0.016*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.014*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"green\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:43:57,903 : INFO : topic #48 (0.020): 0.079*\"octob\" + 0.077*\"sens\" + 0.074*\"march\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.068*\"januari\" + 0.067*\"august\" + 0.067*\"april\" + 0.064*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 00:43:57,904 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.069*\"best\" + 0.035*\"yawn\" + 0.027*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"noll\" + 0.022*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 00:43:57,905 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" 
+ 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:43:57,907 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"known\" + 0.007*\"english\" + 0.007*\"god\"\n", + "2019-01-31 00:43:57,913 : INFO : topic diff=0.005909, rho=0.035028\n", + "2019-01-31 00:43:58,131 : INFO : PROGRESS: pass 0, at document #1632000/4922894\n", + "2019-01-31 00:43:59,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:43:59,809 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"cultur\" + 0.007*\"human\" + 0.006*\"woman\"\n", + "2019-01-31 00:43:59,810 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.016*\"shirin\" + 0.015*\"leah\" + 0.014*\"kim\"\n", + "2019-01-31 00:43:59,811 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"seaport\" + 0.013*\"republ\" + 0.013*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 00:43:59,812 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:43:59,814 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.010*\"yard\"\n", + "2019-01-31 00:43:59,819 : INFO : topic diff=0.004654, rho=0.035007\n", + "2019-01-31 00:43:59,970 : INFO : PROGRESS: pass 0, at document #1634000/4922894\n", + "2019-01-31 
00:44:01,320 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:01,586 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"god\"\n", + "2019-01-31 00:44:01,587 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:44:01,588 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:44:01,590 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.027*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"year\" + 0.010*\"lobe\" + 0.009*\"dai\"\n", + "2019-01-31 00:44:01,591 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.020*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"word\" + 0.012*\"physician\"\n", + "2019-01-31 00:44:01,597 : INFO : topic diff=0.006440, rho=0.034986\n", + "2019-01-31 00:44:01,754 : INFO : PROGRESS: pass 0, at document #1636000/4922894\n", + "2019-01-31 00:44:03,159 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:03,425 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.041*\"american\" + 0.028*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.018*\"polit\" + 0.018*\"dutch\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:44:03,426 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 
0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"god\"\n", + "2019-01-31 00:44:03,427 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"method\" + 0.006*\"mode\" + 0.006*\"measur\"\n", + "2019-01-31 00:44:03,429 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"francisco\" + 0.012*\"santa\" + 0.011*\"mexican\" + 0.011*\"lizard\" + 0.011*\"juan\"\n", + "2019-01-31 00:44:03,430 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 00:44:03,436 : INFO : topic diff=0.004858, rho=0.034964\n", + "2019-01-31 00:44:03,595 : INFO : PROGRESS: pass 0, at document #1638000/4922894\n", + "2019-01-31 00:44:04,992 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:05,259 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"method\" + 0.006*\"measur\" + 0.006*\"mode\"\n", + "2019-01-31 00:44:05,260 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"yard\"\n", + "2019-01-31 00:44:05,261 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:44:05,262 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 
0.006*\"militari\" + 0.006*\"till\" + 0.006*\"pour\"\n", + "2019-01-31 00:44:05,263 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"seaport\" + 0.014*\"report\" + 0.013*\"bypass\" + 0.013*\"republ\"\n", + "2019-01-31 00:44:05,269 : INFO : topic diff=0.005580, rho=0.034943\n", + "2019-01-31 00:44:07,929 : INFO : -11.761 per-word bound, 3471.8 perplexity estimate based on a held-out corpus of 2000 documents with 523897 words\n", + "2019-01-31 00:44:07,929 : INFO : PROGRESS: pass 0, at document #1640000/4922894\n", + "2019-01-31 00:44:09,305 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:09,572 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.037*\"arsen\" + 0.032*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.015*\"exhaust\" + 0.013*\"pain\" + 0.013*\"gai\"\n", + "2019-01-31 00:44:09,573 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.017*\"feel\" + 0.015*\"male\" + 0.012*\"hostil\" + 0.012*\"plaisir\" + 0.009*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:44:09,574 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.046*\"franc\" + 0.033*\"pari\" + 0.022*\"sail\" + 0.020*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.007*\"convei\"\n", + "2019-01-31 00:44:09,576 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:44:09,577 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.007*\"charact\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"septemb\" + 0.005*\"blue\" + 0.005*\"appear\" + 0.004*\"anim\" + 0.004*\"black\"\n", + "2019-01-31 00:44:09,583 : INFO : topic diff=0.005457, rho=0.034922\n", + 
"2019-01-31 00:44:09,739 : INFO : PROGRESS: pass 0, at document #1642000/4922894\n", + "2019-01-31 00:44:11,128 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:11,394 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.024*\"serv\" + 0.020*\"nation\" + 0.019*\"member\" + 0.019*\"govern\" + 0.018*\"gener\" + 0.015*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:44:11,395 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.040*\"tortur\" + 0.032*\"cotton\" + 0.026*\"area\" + 0.024*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:44:11,396 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.004*\"like\" + 0.004*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:44:11,398 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:44:11,399 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.009*\"market\" + 0.009*\"bank\" + 0.009*\"industri\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:44:11,405 : INFO : topic diff=0.005346, rho=0.034900\n", + "2019-01-31 00:44:11,558 : INFO : PROGRESS: pass 0, at document #1644000/4922894\n", + "2019-01-31 00:44:12,943 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:13,209 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.010*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"romanc\" + 
0.009*\"centuri\"\n", + "2019-01-31 00:44:13,211 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"softwar\" + 0.008*\"brio\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"championship\" + 0.007*\"uruguayan\" + 0.007*\"cytokin\"\n", + "2019-01-31 00:44:13,212 : INFO : topic #29 (0.020): 0.025*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.009*\"market\" + 0.009*\"bank\" + 0.009*\"industri\" + 0.009*\"produc\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:44:13,213 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"foam\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:44:13,214 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.023*\"korea\" + 0.020*\"korean\" + 0.018*\"sourc\" + 0.015*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 00:44:13,220 : INFO : topic diff=0.005054, rho=0.034879\n", + "2019-01-31 00:44:13,376 : INFO : PROGRESS: pass 0, at document #1646000/4922894\n", + "2019-01-31 00:44:14,769 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:15,036 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.006*\"mode\" + 0.006*\"measur\"\n", + "2019-01-31 00:44:15,037 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:44:15,038 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.016*\"wind\" + 0.016*\"norwai\" + 0.015*\"norwegian\" + 0.013*\"damag\" + 0.013*\"farid\" + 0.013*\"turkish\" + 
0.012*\"treeless\"\n", + "2019-01-31 00:44:15,040 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:44:15,041 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"champion\" + 0.019*\"tourist\" + 0.018*\"chamber\" + 0.016*\"open\" + 0.016*\"winner\" + 0.015*\"taxpay\" + 0.015*\"martin\"\n", + "2019-01-31 00:44:15,047 : INFO : topic diff=0.006107, rho=0.034858\n", + "2019-01-31 00:44:15,204 : INFO : PROGRESS: pass 0, at document #1648000/4922894\n", + "2019-01-31 00:44:16,598 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:16,865 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.028*\"champion\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:44:16,866 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.012*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:44:16,867 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.007*\"septemb\" + 0.005*\"appear\" + 0.005*\"blue\" + 0.005*\"anim\" + 0.004*\"black\"\n", + "2019-01-31 00:44:16,868 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:44:16,869 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 
0.009*\"yard\"\n", + "2019-01-31 00:44:16,875 : INFO : topic diff=0.005742, rho=0.034837\n", + "2019-01-31 00:44:17,027 : INFO : PROGRESS: pass 0, at document #1650000/4922894\n", + "2019-01-31 00:44:18,376 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:18,642 : INFO : topic #39 (0.020): 0.053*\"canada\" + 0.038*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.019*\"ontario\" + 0.014*\"new\" + 0.014*\"hydrogen\" + 0.013*\"misericordia\" + 0.013*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 00:44:18,643 : INFO : topic #2 (0.020): 0.046*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 00:44:18,644 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.031*\"priest\" + 0.024*\"duke\" + 0.020*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.015*\"count\" + 0.013*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 00:44:18,646 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.023*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"replac\" + 0.007*\"judaism\"\n", + "2019-01-31 00:44:18,647 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.045*\"vigour\" + 0.045*\"popolo\" + 0.040*\"tortur\" + 0.031*\"cotton\" + 0.026*\"area\" + 0.024*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:44:18,652 : INFO : topic diff=0.005770, rho=0.034816\n", + "2019-01-31 00:44:18,809 : INFO : PROGRESS: pass 0, at document #1652000/4922894\n", + "2019-01-31 00:44:20,208 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:20,474 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.012*\"jewish\" + 0.010*\"european\" + 
0.010*\"europ\" + 0.010*\"itali\"\n", + "2019-01-31 00:44:20,475 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.027*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.009*\"task\" + 0.009*\"pseudo\" + 0.009*\"start\"\n", + "2019-01-31 00:44:20,476 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.037*\"arsen\" + 0.034*\"raid\" + 0.028*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:44:20,477 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"softwar\" + 0.008*\"brio\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"diggin\" + 0.007*\"uruguayan\" + 0.007*\"cytokin\"\n", + "2019-01-31 00:44:20,478 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:44:20,484 : INFO : topic diff=0.005179, rho=0.034794\n", + "2019-01-31 00:44:20,641 : INFO : PROGRESS: pass 0, at document #1654000/4922894\n", + "2019-01-31 00:44:22,024 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:22,291 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:44:22,292 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:44:22,293 : INFO : topic #48 (0.020): 0.080*\"octob\" + 0.078*\"sens\" + 0.078*\"march\" + 0.071*\"juli\" + 0.071*\"notion\" + 0.070*\"januari\" + 0.070*\"april\" + 0.069*\"august\" + 
0.067*\"judici\" + 0.065*\"decatur\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:44:22,294 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.023*\"serv\" + 0.020*\"nation\" + 0.020*\"member\" + 0.019*\"govern\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:44:22,295 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"lizard\" + 0.011*\"francisco\" + 0.011*\"mexican\" + 0.011*\"carlo\"\n", + "2019-01-31 00:44:22,301 : INFO : topic diff=0.006476, rho=0.034773\n", + "2019-01-31 00:44:22,460 : INFO : PROGRESS: pass 0, at document #1656000/4922894\n", + "2019-01-31 00:44:23,868 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:24,135 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"yard\"\n", + "2019-01-31 00:44:24,136 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"taxpay\" + 0.019*\"candid\" + 0.013*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"fool\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 00:44:24,137 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.039*\"american\" + 0.029*\"valour\" + 0.019*\"player\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:44:24,138 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.011*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\" + 0.009*\"poll\"\n", + "2019-01-31 00:44:24,139 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.040*\"tortur\" 
+ 0.030*\"cotton\" + 0.026*\"area\" + 0.024*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:44:24,145 : INFO : topic diff=0.006871, rho=0.034752\n", + "2019-01-31 00:44:24,305 : INFO : PROGRESS: pass 0, at document #1658000/4922894\n", + "2019-01-31 00:44:25,697 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:25,963 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.047*\"franc\" + 0.033*\"pari\" + 0.021*\"sail\" + 0.021*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.007*\"convei\"\n", + "2019-01-31 00:44:25,964 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.019*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:44:25,965 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.008*\"armi\" + 0.008*\"till\" + 0.007*\"empath\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:44:25,966 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.025*\"wife\" + 0.020*\"champion\" + 0.019*\"tourist\" + 0.018*\"chamber\" + 0.015*\"open\" + 0.015*\"taxpay\" + 0.015*\"winner\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:44:25,967 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.031*\"cotton\" + 0.026*\"area\" + 0.024*\"multitud\" + 0.024*\"regim\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:44:25,973 : INFO : topic diff=0.005480, rho=0.034731\n", + "2019-01-31 00:44:28,706 : INFO : -11.791 per-word bound, 3544.0 perplexity estimate based on a held-out corpus of 2000 documents with 570585 words\n", + "2019-01-31 00:44:28,707 : INFO : PROGRESS: pass 0, at document #1660000/4922894\n", + "2019-01-31 00:44:30,121 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 00:44:30,387 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.011*\"myspac\"\n", + "2019-01-31 00:44:30,388 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 00:44:30,389 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.029*\"workplac\" + 0.027*\"champion\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"rainfal\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:44:30,390 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"veget\" + 0.009*\"mode\" + 0.007*\"encyclopedia\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"produc\"\n", + "2019-01-31 00:44:30,392 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:44:30,397 : INFO : topic diff=0.006492, rho=0.034711\n", + "2019-01-31 00:44:30,614 : INFO : PROGRESS: pass 0, at document #1662000/4922894\n", + "2019-01-31 00:44:32,025 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:32,292 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:44:32,293 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 
0.011*\"myspac\"\n", + "2019-01-31 00:44:32,294 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.042*\"line\" + 0.037*\"arsen\" + 0.034*\"raid\" + 0.028*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.013*\"pain\" + 0.012*\"gai\"\n", + "2019-01-31 00:44:32,295 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.013*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:44:32,296 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.030*\"priest\" + 0.025*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.019*\"quarterli\" + 0.017*\"grammat\" + 0.015*\"count\" + 0.012*\"brazil\" + 0.012*\"princ\"\n", + "2019-01-31 00:44:32,302 : INFO : topic diff=0.005054, rho=0.034690\n", + "2019-01-31 00:44:32,454 : INFO : PROGRESS: pass 0, at document #1664000/4922894\n", + "2019-01-31 00:44:33,803 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:34,069 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.027*\"jacksonvil\" + 0.024*\"japanes\" + 0.024*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:44:34,070 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:44:34,071 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:44:34,072 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.034*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 
0.011*\"word\"\n", + "2019-01-31 00:44:34,073 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.039*\"american\" + 0.028*\"valour\" + 0.019*\"player\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:44:34,079 : INFO : topic diff=0.004756, rho=0.034669\n", + "2019-01-31 00:44:34,228 : INFO : PROGRESS: pass 0, at document #1666000/4922894\n", + "2019-01-31 00:44:35,576 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:35,843 : INFO : topic #2 (0.020): 0.045*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:44:35,844 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.018*\"sweden\" + 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"norwai\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.013*\"treeless\" + 0.012*\"farid\" + 0.012*\"turkish\"\n", + "2019-01-31 00:44:35,845 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"mode\" + 0.006*\"method\" + 0.006*\"southern\"\n", + "2019-01-31 00:44:35,846 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"armi\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"militari\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:44:35,847 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:44:35,853 : INFO : topic diff=0.005096, rho=0.034648\n", + "2019-01-31 00:44:36,006 : INFO : PROGRESS: pass 0, at document #1668000/4922894\n", + "2019-01-31 
00:44:37,599 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:37,865 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.014*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:44:37,866 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:44:37,868 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.039*\"american\" + 0.029*\"valour\" + 0.021*\"dutch\" + 0.019*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:44:37,869 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 00:44:37,870 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:44:37,876 : INFO : topic diff=0.005313, rho=0.034627\n", + "2019-01-31 00:44:38,035 : INFO : PROGRESS: pass 0, at document #1670000/4922894\n", + "2019-01-31 00:44:39,441 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:39,707 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.011*\"pop\" + 0.008*\"championship\" + 0.008*\"brio\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"cytokin\" + 0.008*\"uruguayan\"\n", + "2019-01-31 00:44:39,708 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.039*\"american\" + 0.029*\"valour\" + 0.021*\"dutch\" + 0.018*\"player\" + 
0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:44:39,710 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:44:39,711 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.004*\"like\" + 0.004*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:44:39,712 : INFO : topic #2 (0.020): 0.044*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:44:39,718 : INFO : topic diff=0.004340, rho=0.034606\n", + "2019-01-31 00:44:39,872 : INFO : PROGRESS: pass 0, at document #1672000/4922894\n", + "2019-01-31 00:44:41,237 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:41,503 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:44:41,504 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"champion\" + 0.019*\"tourist\" + 0.017*\"chamber\" + 0.016*\"poet\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\"\n", + "2019-01-31 00:44:41,505 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:44:41,507 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.019*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 
0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:44:41,508 : INFO : topic #39 (0.020): 0.052*\"canada\" + 0.039*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.018*\"ontario\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.014*\"hydrogen\" + 0.012*\"quebec\"\n", + "2019-01-31 00:44:41,513 : INFO : topic diff=0.005141, rho=0.034586\n", + "2019-01-31 00:44:41,668 : INFO : PROGRESS: pass 0, at document #1674000/4922894\n", + "2019-01-31 00:44:43,054 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:43,320 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:44:43,321 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.031*\"priest\" + 0.023*\"duke\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.015*\"count\" + 0.013*\"portugues\" + 0.012*\"kingdom\"\n", + "2019-01-31 00:44:43,322 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:44:43,323 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"lizard\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 00:44:43,324 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.027*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"center\" + 0.010*\"lobe\" + 0.010*\"year\" + 0.009*\"dai\"\n", + "2019-01-31 00:44:43,330 : INFO : topic diff=0.005281, rho=0.034565\n", + "2019-01-31 00:44:43,486 : INFO : PROGRESS: pass 0, at document 
#1676000/4922894\n", + "2019-01-31 00:44:44,868 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:45,136 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"brio\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"cytokin\" + 0.008*\"uruguayan\"\n", + "2019-01-31 00:44:45,137 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"gestur\" + 0.007*\"septemb\" + 0.006*\"comic\" + 0.005*\"appear\" + 0.005*\"blue\" + 0.005*\"anim\" + 0.005*\"black\"\n", + "2019-01-31 00:44:45,138 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"septemb\" + 0.022*\"epiru\" + 0.018*\"teacher\" + 0.018*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:44:45,139 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"offic\" + 0.025*\"minist\" + 0.021*\"serv\" + 0.020*\"nation\" + 0.019*\"govern\" + 0.019*\"member\" + 0.019*\"gener\" + 0.016*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:44:45,141 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"armi\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"till\" + 0.007*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:44:45,147 : INFO : topic diff=0.004645, rho=0.034544\n", + "2019-01-31 00:44:45,302 : INFO : PROGRESS: pass 0, at document #1678000/4922894\n", + "2019-01-31 00:44:46,693 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:46,959 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.034*\"yawn\" + 0.027*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.013*\"misconcept\"\n", + "2019-01-31 00:44:46,960 : INFO : topic #40 (0.020): 0.092*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 
0.022*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:44:46,961 : INFO : topic #1 (0.020): 0.049*\"china\" + 0.043*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.019*\"leah\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:44:46,962 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"swedish\" + 0.018*\"sweden\" + 0.016*\"norwai\" + 0.016*\"wind\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"treeless\" + 0.012*\"farid\" + 0.012*\"denmark\"\n", + "2019-01-31 00:44:46,963 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:44:46,969 : INFO : topic diff=0.005707, rho=0.034524\n", + "2019-01-31 00:44:49,606 : INFO : -11.894 per-word bound, 3806.5 perplexity estimate based on a held-out corpus of 2000 documents with 538208 words\n", + "2019-01-31 00:44:49,606 : INFO : PROGRESS: pass 0, at document #1680000/4922894\n", + "2019-01-31 00:44:50,972 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:51,238 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.031*\"american\" + 0.027*\"new\" + 0.017*\"year\" + 0.015*\"california\" + 0.012*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:44:51,240 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:44:51,241 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 
0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"cathedr\" + 0.010*\"poll\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 00:44:51,242 : INFO : topic #39 (0.020): 0.053*\"canada\" + 0.039*\"canadian\" + 0.023*\"toronto\" + 0.021*\"hoar\" + 0.019*\"ontario\" + 0.015*\"misericordia\" + 0.014*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 00:44:51,243 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:44:51,249 : INFO : topic diff=0.004989, rho=0.034503\n", + "2019-01-31 00:44:51,399 : INFO : PROGRESS: pass 0, at document #1682000/4922894\n", + "2019-01-31 00:44:52,749 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:53,016 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.026*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"center\" + 0.010*\"lobe\" + 0.010*\"year\" + 0.009*\"dai\"\n", + "2019-01-31 00:44:53,017 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.008*\"palmer\" + 0.008*\"foam\" + 0.008*\"vacant\" + 0.008*\"land\"\n", + "2019-01-31 00:44:53,018 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.019*\"folei\" + 0.019*\"player\" + 0.018*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:44:53,019 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.035*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.024*\"personifi\" + 0.023*\"moscow\" + 0.018*\"poland\" + 0.017*\"unfortun\" + 0.016*\"turin\"\n", + "2019-01-31 00:44:53,020 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.025*\"factor\" + 0.019*\"adulthood\" + 
0.016*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"yawn\"\n", + "2019-01-31 00:44:53,026 : INFO : topic diff=0.005542, rho=0.034483\n", + "2019-01-31 00:44:53,178 : INFO : PROGRESS: pass 0, at document #1684000/4922894\n", + "2019-01-31 00:44:54,550 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:54,820 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.031*\"priest\" + 0.024*\"duke\" + 0.019*\"idiosyncrat\" + 0.019*\"quarterli\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.014*\"count\" + 0.013*\"portugues\" + 0.012*\"kingdom\"\n", + "2019-01-31 00:44:54,821 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.026*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"center\" + 0.010*\"lobe\" + 0.009*\"year\" + 0.009*\"dai\"\n", + "2019-01-31 00:44:54,822 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"anglo\" + 0.012*\"islam\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.009*\"sri\"\n", + "2019-01-31 00:44:54,824 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"method\" + 0.006*\"poet\" + 0.006*\"differ\"\n", + "2019-01-31 00:44:54,825 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.031*\"cotton\" + 0.031*\"american\" + 0.027*\"new\" + 0.017*\"year\" + 0.015*\"california\" + 0.012*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:44:54,831 : INFO : topic diff=0.004566, rho=0.034462\n", + "2019-01-31 00:44:54,991 : INFO : PROGRESS: pass 0, at document #1686000/4922894\n", + "2019-01-31 00:44:56,404 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:56,671 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.034*\"publicis\" + 
0.025*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:44:56,672 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:44:56,674 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:44:56,675 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.031*\"priest\" + 0.023*\"duke\" + 0.020*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.014*\"count\" + 0.013*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 00:44:56,676 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"servitud\"\n", + "2019-01-31 00:44:56,682 : INFO : topic diff=0.005766, rho=0.034442\n", + "2019-01-31 00:44:56,840 : INFO : PROGRESS: pass 0, at document #1688000/4922894\n", + "2019-01-31 00:44:58,246 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:44:58,512 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:44:58,513 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.033*\"germani\" + 0.015*\"vol\" + 0.013*\"berlin\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:44:58,515 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 
0.021*\"rivièr\" + 0.019*\"buford\" + 0.013*\"briarwood\" + 0.013*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.010*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:44:58,516 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:44:58,517 : INFO : topic #1 (0.020): 0.050*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"leah\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:44:58,523 : INFO : topic diff=0.004404, rho=0.034421\n", + "2019-01-31 00:44:58,680 : INFO : PROGRESS: pass 0, at document #1690000/4922894\n", + "2019-01-31 00:45:00,075 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:00,341 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:45:00,342 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"anglo\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"sri\"\n", + "2019-01-31 00:45:00,343 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"champion\" + 0.019*\"tourist\" + 0.017*\"chamber\" + 0.016*\"martin\" + 0.016*\"taxpay\" + 0.015*\"poet\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:45:00,344 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:45:00,346 : INFO : topic #39 (0.020): 0.051*\"canada\" + 0.038*\"canadian\" + 
0.022*\"toronto\" + 0.021*\"hoar\" + 0.020*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:45:00,352 : INFO : topic diff=0.004640, rho=0.034401\n", + "2019-01-31 00:45:00,510 : INFO : PROGRESS: pass 0, at document #1692000/4922894\n", + "2019-01-31 00:45:01,918 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:02,184 : INFO : topic #1 (0.020): 0.050*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"leah\" + 0.017*\"korean\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:45:02,185 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"sri\"\n", + "2019-01-31 00:45:02,187 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"poll\" + 0.009*\"centuri\"\n", + "2019-01-31 00:45:02,188 : INFO : topic #20 (0.020): 0.137*\"scholar\" + 0.040*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:45:02,189 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:45:02,195 : INFO : topic diff=0.004626, rho=0.034381\n", + "2019-01-31 00:45:02,409 : INFO : PROGRESS: pass 0, at document #1694000/4922894\n", + "2019-01-31 00:45:03,806 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:45:04,076 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"cathedr\" + 0.009*\"poll\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 00:45:04,077 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:45:04,078 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"taxpay\" + 0.018*\"candid\" + 0.013*\"tornado\" + 0.013*\"squatter\" + 0.013*\"find\" + 0.012*\"ret\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:45:04,079 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.009*\"replac\" + 0.007*\"judaism\"\n", + "2019-01-31 00:45:04,081 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:45:04,087 : INFO : topic diff=0.004795, rho=0.034360\n", + "2019-01-31 00:45:04,240 : INFO : PROGRESS: pass 0, at document #1696000/4922894\n", + "2019-01-31 00:45:05,629 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:05,895 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 00:45:05,896 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"foam\" + 
0.008*\"lobe\"\n", + "2019-01-31 00:45:05,898 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.033*\"germani\" + 0.015*\"vol\" + 0.013*\"berlin\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.012*\"israel\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 00:45:05,899 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"like\"\n", + "2019-01-31 00:45:05,900 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.023*\"rivièr\" + 0.019*\"buford\" + 0.013*\"briarwood\" + 0.012*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 00:45:05,906 : INFO : topic diff=0.006264, rho=0.034340\n", + "2019-01-31 00:45:06,066 : INFO : PROGRESS: pass 0, at document #1698000/4922894\n", + "2019-01-31 00:45:07,474 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:07,740 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.025*\"wife\" + 0.019*\"champion\" + 0.019*\"tourist\" + 0.017*\"chamber\" + 0.016*\"martin\" + 0.016*\"taxpay\" + 0.015*\"poet\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:45:07,742 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.021*\"cathol\" + 0.020*\"christian\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"poll\" + 0.010*\"cathedr\" + 0.010*\"centuri\" + 0.010*\"romanc\"\n", + "2019-01-31 00:45:07,743 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.026*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.011*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"year\" + 0.009*\"highli\"\n", + "2019-01-31 00:45:07,744 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.040*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"district\" + 
0.009*\"task\"\n", + "2019-01-31 00:45:07,745 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.036*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:45:07,751 : INFO : topic diff=0.005738, rho=0.034320\n", + "2019-01-31 00:45:10,412 : INFO : -11.653 per-word bound, 3221.2 perplexity estimate based on a held-out corpus of 2000 documents with 537741 words\n", + "2019-01-31 00:45:10,413 : INFO : PROGRESS: pass 0, at document #1700000/4922894\n", + "2019-01-31 00:45:11,787 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:12,054 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.034*\"rural\" + 0.034*\"sovereignti\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.022*\"moscow\" + 0.022*\"personifi\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.016*\"turin\"\n", + "2019-01-31 00:45:12,055 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.031*\"cotton\" + 0.029*\"area\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.022*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:45:12,056 : INFO : topic #2 (0.020): 0.043*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:45:12,057 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:45:12,058 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.025*\"wife\" + 0.019*\"tourist\" + 0.019*\"champion\" + 0.017*\"chamber\" + 0.016*\"martin\" + 0.016*\"taxpay\" + 0.015*\"poet\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:45:12,064 : INFO : topic diff=0.004708, 
rho=0.034300\n", + "2019-01-31 00:45:12,222 : INFO : PROGRESS: pass 0, at document #1702000/4922894\n", + "2019-01-31 00:45:13,627 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:13,893 : INFO : topic #39 (0.020): 0.054*\"canada\" + 0.039*\"canadian\" + 0.022*\"toronto\" + 0.021*\"ontario\" + 0.020*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 00:45:13,894 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"collect\"\n", + "2019-01-31 00:45:13,895 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.013*\"liber\" + 0.013*\"bypass\"\n", + "2019-01-31 00:45:13,896 : INFO : topic #29 (0.020): 0.027*\"companhia\" + 0.011*\"busi\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"market\" + 0.009*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:45:13,897 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"black\" + 0.017*\"illicit\" + 0.016*\"colder\" + 0.016*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"depress\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:45:13,903 : INFO : topic diff=0.005445, rho=0.034280\n", + "2019-01-31 00:45:14,058 : INFO : PROGRESS: pass 0, at document #1704000/4922894\n", + "2019-01-31 00:45:15,432 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:15,699 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"théori\" + 
0.006*\"southern\" + 0.006*\"method\" + 0.006*\"measur\"\n", + "2019-01-31 00:45:15,700 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:45:15,701 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:45:15,702 : INFO : topic #2 (0.020): 0.043*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:45:15,703 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.006*\"appear\" + 0.005*\"anim\" + 0.004*\"dixi\"\n", + "2019-01-31 00:45:15,709 : INFO : topic diff=0.005435, rho=0.034259\n", + "2019-01-31 00:45:15,867 : INFO : PROGRESS: pass 0, at document #1706000/4922894\n", + "2019-01-31 00:45:17,271 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:17,540 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.026*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"year\" + 0.009*\"highli\"\n", + "2019-01-31 00:45:17,541 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.036*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:45:17,543 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"appear\" + 0.006*\"blue\" + 0.005*\"anim\" + 
0.005*\"dixi\"\n", + "2019-01-31 00:45:17,544 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.023*\"reprint\" + 0.023*\"personifi\" + 0.022*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 00:45:17,545 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"oper\"\n", + "2019-01-31 00:45:17,551 : INFO : topic diff=0.005527, rho=0.034239\n", + "2019-01-31 00:45:17,707 : INFO : PROGRESS: pass 0, at document #1708000/4922894\n", + "2019-01-31 00:45:19,090 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:19,356 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"seaport\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"liber\"\n", + "2019-01-31 00:45:19,357 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.020*\"serv\" + 0.020*\"member\" + 0.019*\"gener\" + 0.017*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:45:19,358 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"oper\"\n", + "2019-01-31 00:45:19,359 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.009*\"sri\"\n", + "2019-01-31 00:45:19,361 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", 
+ "2019-01-31 00:45:19,366 : INFO : topic diff=0.004782, rho=0.034219\n", + "2019-01-31 00:45:19,520 : INFO : PROGRESS: pass 0, at document #1710000/4922894\n", + "2019-01-31 00:45:20,894 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:21,161 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:45:21,162 : INFO : topic #2 (0.020): 0.045*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.013*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:45:21,163 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.025*\"hous\" + 0.024*\"rivièr\" + 0.018*\"buford\" + 0.013*\"briarwood\" + 0.012*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:45:21,164 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"black\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"light\" + 0.007*\"depress\"\n", + "2019-01-31 00:45:21,165 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.029*\"priest\" + 0.023*\"duke\" + 0.020*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"quarterli\" + 0.014*\"brazil\" + 0.014*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 00:45:21,171 : INFO : topic diff=0.004746, rho=0.034199\n", + "2019-01-31 00:45:21,332 : INFO : PROGRESS: pass 0, at document #1712000/4922894\n", + "2019-01-31 00:45:22,764 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:23,030 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.025*\"new\" + 0.023*\"palmer\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 
0.009*\"year\" + 0.009*\"highli\"\n", + "2019-01-31 00:45:23,031 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 00:45:23,032 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:45:23,033 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:45:23,034 : INFO : topic #29 (0.020): 0.027*\"companhia\" + 0.011*\"busi\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"market\" + 0.009*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:45:23,040 : INFO : topic diff=0.005510, rho=0.034179\n", + "2019-01-31 00:45:23,195 : INFO : PROGRESS: pass 0, at document #1714000/4922894\n", + "2019-01-31 00:45:24,564 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:24,831 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.030*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:45:24,832 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.021*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.008*\"convei\"\n", + "2019-01-31 00:45:24,833 : INFO : topic #15 (0.020): 0.011*\"organ\" + 0.011*\"small\" + 0.011*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 
0.007*\"woman\"\n", + "2019-01-31 00:45:24,834 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.012*\"juan\" + 0.012*\"lizard\" + 0.012*\"carlo\"\n", + "2019-01-31 00:45:24,835 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.023*\"reprint\" + 0.023*\"personifi\" + 0.022*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"turin\"\n", + "2019-01-31 00:45:24,841 : INFO : topic diff=0.005373, rho=0.034159\n", + "2019-01-31 00:45:25,000 : INFO : PROGRESS: pass 0, at document #1716000/4922894\n", + "2019-01-31 00:45:26,900 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:45:27,166 : INFO : topic #39 (0.020): 0.054*\"canada\" + 0.039*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.021*\"ontario\" + 0.015*\"new\" + 0.014*\"hydrogen\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:45:27,167 : INFO : topic #29 (0.020): 0.026*\"companhia\" + 0.011*\"busi\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"produc\" + 0.010*\"market\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:45:27,168 : INFO : topic #15 (0.020): 0.011*\"organ\" + 0.011*\"develop\" + 0.011*\"small\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:45:27,169 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.026*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"year\" + 0.009*\"highli\"\n", + "2019-01-31 00:45:27,170 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.034*\"germani\" + 0.015*\"vol\" + 0.013*\"jewish\" + 0.013*\"berlin\" + 
0.013*\"der\" + 0.012*\"israel\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"greek\"\n", + "2019-01-31 00:45:27,176 : INFO : topic diff=0.004973, rho=0.034139\n", + "2019-01-31 00:45:27,346 : INFO : PROGRESS: pass 0, at document #1718000/4922894\n", + "2019-01-31 00:45:28,767 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:29,034 : INFO : topic #10 (0.020): 0.011*\"hormon\" + 0.010*\"cdd\" + 0.010*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:45:29,036 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:45:29,037 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.026*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:45:29,038 : INFO : topic #39 (0.020): 0.054*\"canada\" + 0.040*\"canadian\" + 0.022*\"toronto\" + 0.022*\"ontario\" + 0.021*\"hoar\" + 0.015*\"new\" + 0.014*\"hydrogen\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:45:29,039 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.011*\"polaris\" + 0.009*\"legal\" + 0.008*\"replac\" + 0.007*\"judaism\"\n", + "2019-01-31 00:45:29,045 : INFO : topic diff=0.004782, rho=0.034120\n", + "2019-01-31 00:45:31,748 : INFO : -11.861 per-word bound, 3719.0 perplexity estimate based on a held-out corpus of 2000 documents with 550836 words\n", + "2019-01-31 00:45:31,748 : INFO : PROGRESS: pass 0, at document #1720000/4922894\n", + "2019-01-31 00:45:33,148 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:45:33,415 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.030*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:45:33,416 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.036*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:45:33,417 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"seaport\" + 0.014*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\"\n", + "2019-01-31 00:45:33,418 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"brio\" + 0.007*\"user\"\n", + "2019-01-31 00:45:33,419 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.026*\"japanes\" + 0.023*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:45:33,426 : INFO : topic diff=0.004595, rho=0.034100\n", + "2019-01-31 00:45:33,578 : INFO : PROGRESS: pass 0, at document #1722000/4922894\n", + "2019-01-31 00:45:34,938 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:35,204 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.011*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:45:35,205 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"rhyme\" + 
0.008*\"paul\"\n", + "2019-01-31 00:45:35,206 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.025*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:45:35,207 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.025*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"chamber\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"poet\"\n", + "2019-01-31 00:45:35,209 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.007*\"like\"\n", + "2019-01-31 00:45:35,215 : INFO : topic diff=0.005504, rho=0.034080\n", + "2019-01-31 00:45:35,369 : INFO : PROGRESS: pass 0, at document #1724000/4922894\n", + "2019-01-31 00:45:36,754 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:37,020 : INFO : topic #10 (0.020): 0.011*\"hormon\" + 0.010*\"cdd\" + 0.010*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:45:37,021 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 00:45:37,022 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.028*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.010*\"alam\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 00:45:37,023 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"cytokin\" + 0.008*\"brio\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 
0.008*\"uruguayan\"\n", + "2019-01-31 00:45:37,024 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.017*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:45:37,030 : INFO : topic diff=0.005104, rho=0.034060\n", + "2019-01-31 00:45:37,188 : INFO : PROGRESS: pass 0, at document #1726000/4922894\n", + "2019-01-31 00:45:38,579 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:38,845 : INFO : topic #10 (0.020): 0.011*\"hormon\" + 0.010*\"cdd\" + 0.010*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:45:38,846 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"mode\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 00:45:38,847 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.012*\"santa\" + 0.012*\"lizard\" + 0.012*\"carlo\" + 0.011*\"juan\"\n", + "2019-01-31 00:45:38,849 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.036*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"artist\"\n", + "2019-01-31 00:45:38,850 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"pour\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 00:45:38,856 : INFO : topic diff=0.005242, rho=0.034040\n", + "2019-01-31 00:45:39,069 : INFO : PROGRESS: pass 0, at document #1728000/4922894\n", + "2019-01-31 00:45:40,443 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:45:40,709 : INFO : topic #21 (0.020): 0.039*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.012*\"lizard\" + 0.012*\"carlo\" + 0.011*\"juan\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:45:40,710 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"brio\"\n", + "2019-01-31 00:45:40,712 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"théori\" + 0.006*\"mode\" + 0.006*\"poet\" + 0.006*\"differ\" + 0.006*\"servitud\" + 0.006*\"southern\"\n", + "2019-01-31 00:45:40,713 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.036*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 00:45:40,714 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.027*\"champion\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"gold\" + 0.018*\"rainfal\"\n", + "2019-01-31 00:45:40,720 : INFO : topic diff=0.005225, rho=0.034021\n", + "2019-01-31 00:45:40,881 : INFO : PROGRESS: pass 0, at document #1730000/4922894\n", + "2019-01-31 00:45:42,311 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:42,577 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:45:42,578 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.031*\"cotton\" + 0.028*\"area\" + 
0.023*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:45:42,579 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"pour\" + 0.006*\"teufel\" + 0.006*\"militari\" + 0.006*\"till\"\n", + "2019-01-31 00:45:42,580 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.036*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"damn\" + 0.017*\"compos\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.011*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:45:42,581 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:45:42,587 : INFO : topic diff=0.007418, rho=0.034001\n", + "2019-01-31 00:45:42,744 : INFO : PROGRESS: pass 0, at document #1732000/4922894\n", + "2019-01-31 00:45:44,132 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:44,398 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.030*\"priest\" + 0.024*\"duke\" + 0.020*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"quarterli\" + 0.015*\"brazil\" + 0.013*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 00:45:44,399 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.036*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.011*\"word\" + 0.011*\"physician\"\n", + "2019-01-31 00:45:44,400 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"théori\" + 0.010*\"ret\"\n", + "2019-01-31 00:45:44,401 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 0.031*\"cotton\" + 0.030*\"american\" + 0.028*\"new\" + 
0.017*\"year\" + 0.015*\"california\" + 0.012*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:45:44,402 : INFO : topic #1 (0.020): 0.050*\"china\" + 0.043*\"chilton\" + 0.030*\"han\" + 0.023*\"hong\" + 0.023*\"korea\" + 0.023*\"kong\" + 0.018*\"korean\" + 0.018*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 00:45:44,408 : INFO : topic diff=0.004885, rho=0.033981\n", + "2019-01-31 00:45:44,569 : INFO : PROGRESS: pass 0, at document #1734000/4922894\n", + "2019-01-31 00:45:45,981 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:46,247 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.034*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.012*\"israel\" + 0.010*\"european\" + 0.010*\"greek\" + 0.010*\"austria\"\n", + "2019-01-31 00:45:46,249 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"republ\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 00:45:46,250 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.016*\"wind\" + 0.016*\"swedish\" + 0.016*\"sweden\" + 0.015*\"norwai\" + 0.015*\"treeless\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.013*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:45:46,251 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:45:46,252 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.026*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:45:46,258 : INFO : topic diff=0.004924, rho=0.033962\n", + "2019-01-31 00:45:46,414 : INFO : PROGRESS: pass 0, at document 
#1736000/4922894\n", + "2019-01-31 00:45:47,852 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:48,118 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.012*\"lizard\" + 0.012*\"francisco\" + 0.012*\"carlo\" + 0.011*\"mexican\"\n", + "2019-01-31 00:45:48,120 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"appear\" + 0.005*\"blue\" + 0.005*\"anim\" + 0.005*\"admit\"\n", + "2019-01-31 00:45:48,121 : INFO : topic #32 (0.020): 0.056*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.031*\"cotton\" + 0.028*\"area\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:45:48,122 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:45:48,123 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"mode\" + 0.006*\"differ\" + 0.006*\"southern\"\n", + "2019-01-31 00:45:48,129 : INFO : topic diff=0.005243, rho=0.033942\n", + "2019-01-31 00:45:48,287 : INFO : PROGRESS: pass 0, at document #1738000/4922894\n", + "2019-01-31 00:45:49,681 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:49,947 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:45:49,948 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 
0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:45:49,949 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.028*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.012*\"anglo\" + 0.011*\"khalsa\" + 0.010*\"televis\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"sri\"\n", + "2019-01-31 00:45:49,950 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.039*\"struggl\" + 0.030*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.011*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 00:45:49,951 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.011*\"ret\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 00:45:49,957 : INFO : topic diff=0.005540, rho=0.033923\n", + "2019-01-31 00:45:52,718 : INFO : -11.684 per-word bound, 3289.3 perplexity estimate based on a held-out corpus of 2000 documents with 583647 words\n", + "2019-01-31 00:45:52,718 : INFO : PROGRESS: pass 0, at document #1740000/4922894\n", + "2019-01-31 00:45:54,137 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:54,403 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:45:54,404 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.039*\"struggl\" + 0.030*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"gothic\" + 0.011*\"district\" + 0.010*\"start\"\n", + "2019-01-31 00:45:54,405 : INFO : topic #10 (0.020): 0.010*\"hormon\" + 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"have\" 
+ 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"pathwai\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:45:54,406 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:45:54,408 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:45:54,413 : INFO : topic diff=0.006061, rho=0.033903\n", + "2019-01-31 00:45:54,569 : INFO : PROGRESS: pass 0, at document #1742000/4922894\n", + "2019-01-31 00:45:55,943 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:56,209 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.020*\"folei\" + 0.020*\"player\" + 0.019*\"polit\" + 0.019*\"dutch\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:45:56,211 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"septemb\" + 0.025*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:45:56,212 : INFO : topic #20 (0.020): 0.136*\"scholar\" + 0.039*\"struggl\" + 0.030*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"gothic\" + 0.010*\"district\" + 0.010*\"start\"\n", + "2019-01-31 00:45:56,213 : INFO : topic #39 (0.020): 0.055*\"canada\" + 0.040*\"canadian\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.020*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.013*\"misericordia\" + 0.013*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 00:45:56,214 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 
0.018*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:45:56,220 : INFO : topic diff=0.004280, rho=0.033884\n", + "2019-01-31 00:45:56,377 : INFO : PROGRESS: pass 0, at document #1744000/4922894\n", + "2019-01-31 00:45:57,767 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:58,033 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:45:58,034 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.030*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:45:58,035 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.077*\"march\" + 0.077*\"octob\" + 0.068*\"januari\" + 0.068*\"notion\" + 0.067*\"april\" + 0.066*\"juli\" + 0.065*\"august\" + 0.065*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 00:45:58,036 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:45:58,038 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:45:58,043 : INFO : topic diff=0.006582, rho=0.033864\n", + "2019-01-31 00:45:58,201 : INFO : PROGRESS: pass 0, at document #1746000/4922894\n", + "2019-01-31 00:45:59,599 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:45:59,868 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.028*\"offic\" + 0.024*\"minist\" + 0.021*\"nation\" + 
0.021*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.015*\"start\"\n", + "2019-01-31 00:45:59,869 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:45:59,870 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:45:59,871 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:45:59,872 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:45:59,878 : INFO : topic diff=0.005013, rho=0.033845\n", + "2019-01-31 00:46:00,039 : INFO : PROGRESS: pass 0, at document #1748000/4922894\n", + "2019-01-31 00:46:01,773 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:02,040 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.028*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.012*\"anglo\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"televis\" + 0.009*\"sri\"\n", + "2019-01-31 00:46:02,041 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:46:02,043 : INFO : topic #29 (0.020): 0.026*\"companhia\" + 0.011*\"million\" + 0.011*\"bank\" + 0.011*\"busi\" + 
0.010*\"produc\" + 0.010*\"market\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:46:02,044 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.021*\"male\" + 0.019*\"adulthood\" + 0.017*\"feel\" + 0.012*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:46:02,045 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.065*\"best\" + 0.036*\"yawn\" + 0.030*\"jacksonvil\" + 0.026*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:46:02,051 : INFO : topic diff=0.005182, rho=0.033826\n", + "2019-01-31 00:46:02,206 : INFO : PROGRESS: pass 0, at document #1750000/4922894\n", + "2019-01-31 00:46:04,012 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:04,278 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:46:04,279 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.020*\"event\" + 0.019*\"taxpay\" + 0.018*\"rainfal\" + 0.018*\"gold\"\n", + "2019-01-31 00:46:04,280 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"comic\" + 0.005*\"blue\" + 0.005*\"anim\" + 0.005*\"admit\"\n", + "2019-01-31 00:46:04,281 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:46:04,282 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 
0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:46:04,288 : INFO : topic diff=0.005553, rho=0.033806\n", + "2019-01-31 00:46:04,445 : INFO : PROGRESS: pass 0, at document #1752000/4922894\n", + "2019-01-31 00:46:05,835 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:06,102 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"land\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 00:46:06,103 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.023*\"personifi\" + 0.022*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"turin\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:46:06,104 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"comic\" + 0.006*\"appear\" + 0.005*\"blue\" + 0.005*\"anim\" + 0.005*\"admit\"\n", + "2019-01-31 00:46:06,105 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"carlo\" + 0.012*\"lizard\" + 0.011*\"francisco\" + 0.011*\"juan\"\n", + "2019-01-31 00:46:06,106 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"gastrointestin\"\n", + "2019-01-31 00:46:06,112 : INFO : topic diff=0.005947, rho=0.033787\n", + "2019-01-31 00:46:06,269 : INFO : PROGRESS: pass 0, at document #1754000/4922894\n", + "2019-01-31 00:46:07,656 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:07,921 : INFO : topic #35 
(0.020): 0.057*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:46:07,922 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.078*\"octob\" + 0.069*\"notion\" + 0.069*\"januari\" + 0.068*\"april\" + 0.068*\"juli\" + 0.066*\"august\" + 0.066*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 00:46:07,924 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"anim\" + 0.005*\"admit\"\n", + "2019-01-31 00:46:07,925 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"effect\" + 0.006*\"gastrointestin\" + 0.006*\"proper\"\n", + "2019-01-31 00:46:07,926 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.011*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:46:07,932 : INFO : topic diff=0.005338, rho=0.033768\n", + "2019-01-31 00:46:08,088 : INFO : PROGRESS: pass 0, at document #1756000/4922894\n", + "2019-01-31 00:46:09,473 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:09,739 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.039*\"tortur\" + 0.031*\"cotton\" + 0.028*\"area\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.022*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:46:09,740 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"male\" + 0.019*\"adulthood\" + 0.017*\"feel\" + 0.012*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:46:09,741 : INFO : topic #3 (0.020): 
0.033*\"present\" + 0.028*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.018*\"gener\" + 0.016*\"seri\" + 0.016*\"start\"\n", + "2019-01-31 00:46:09,742 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\" + 0.009*\"dai\"\n", + "2019-01-31 00:46:09,742 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"carlo\" + 0.012*\"lizard\" + 0.011*\"francisco\" + 0.011*\"mexican\"\n", + "2019-01-31 00:46:09,748 : INFO : topic diff=0.004541, rho=0.033748\n", + "2019-01-31 00:46:09,968 : INFO : PROGRESS: pass 0, at document #1758000/4922894\n", + "2019-01-31 00:46:11,398 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:11,664 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:46:11,665 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:46:11,666 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.017*\"wind\" + 0.016*\"swedish\" + 0.015*\"sweden\" + 0.015*\"damag\" + 0.014*\"norwai\" + 0.014*\"treeless\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:46:11,667 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"republ\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 00:46:11,669 : INFO : topic #42 (0.020): 
0.046*\"german\" + 0.032*\"germani\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.013*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:46:11,674 : INFO : topic diff=0.005243, rho=0.033729\n", + "2019-01-31 00:46:14,338 : INFO : -11.536 per-word bound, 2970.2 perplexity estimate based on a held-out corpus of 2000 documents with 540914 words\n", + "2019-01-31 00:46:14,339 : INFO : PROGRESS: pass 0, at document #1760000/4922894\n", + "2019-01-31 00:46:15,706 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:15,972 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"championship\" + 0.007*\"softwar\" + 0.007*\"diggin\"\n", + "2019-01-31 00:46:15,973 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:46:15,974 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:46:15,975 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:46:15,976 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"bahá\" + 0.009*\"crew\"\n", + "2019-01-31 00:46:15,982 : INFO : topic diff=0.004600, rho=0.033710\n", + "2019-01-31 00:46:16,141 : INFO : PROGRESS: pass 0, at document #1762000/4922894\n", 
+ "2019-01-31 00:46:17,545 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:17,811 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.024*\"poison\" + 0.023*\"reprint\" + 0.022*\"personifi\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:46:17,812 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.028*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.010*\"alam\" + 0.010*\"televis\" + 0.009*\"tajikistan\"\n", + "2019-01-31 00:46:17,813 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.027*\"australia\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 00:46:17,814 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.009*\"battalion\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"teufel\" + 0.006*\"pour\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:46:17,815 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.011*\"myspac\"\n", + "2019-01-31 00:46:17,822 : INFO : topic diff=0.006460, rho=0.033691\n", + "2019-01-31 00:46:17,983 : INFO : PROGRESS: pass 0, at document #1764000/4922894\n", + "2019-01-31 00:46:19,374 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:19,643 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:46:19,644 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.017*\"factor\" + 0.015*\"yawn\" + 
0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:46:19,645 : INFO : topic #15 (0.020): 0.011*\"organ\" + 0.010*\"small\" + 0.010*\"develop\" + 0.010*\"group\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:46:19,646 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.020*\"dutch\" + 0.019*\"folei\" + 0.019*\"player\" + 0.018*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:46:19,648 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\" + 0.009*\"hot\"\n", + "2019-01-31 00:46:19,653 : INFO : topic diff=0.004579, rho=0.033672\n", + "2019-01-31 00:46:19,813 : INFO : PROGRESS: pass 0, at document #1766000/4922894\n", + "2019-01-31 00:46:21,177 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:21,443 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.032*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.012*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:46:21,445 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:46:21,446 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"wind\" + 0.016*\"swedish\" + 0.016*\"sweden\" + 0.015*\"damag\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.013*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:46:21,447 : INFO : topic #48 (0.020): 0.080*\"march\" + 
0.078*\"sens\" + 0.078*\"octob\" + 0.072*\"januari\" + 0.070*\"notion\" + 0.070*\"april\" + 0.069*\"juli\" + 0.068*\"judici\" + 0.067*\"august\" + 0.065*\"decatur\"\n", + "2019-01-31 00:46:21,448 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.020*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:46:21,454 : INFO : topic diff=0.005109, rho=0.033653\n", + "2019-01-31 00:46:21,608 : INFO : PROGRESS: pass 0, at document #1768000/4922894\n", + "2019-01-31 00:46:22,992 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:23,258 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"anim\" + 0.005*\"vision\"\n", + "2019-01-31 00:46:23,259 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.045*\"chilton\" + 0.024*\"korea\" + 0.022*\"hong\" + 0.022*\"kong\" + 0.020*\"han\" + 0.020*\"korean\" + 0.018*\"leah\" + 0.015*\"sourc\" + 0.015*\"kim\"\n", + "2019-01-31 00:46:23,260 : INFO : topic #29 (0.020): 0.026*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.010*\"bank\" + 0.010*\"produc\" + 0.010*\"market\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:46:23,262 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:46:23,263 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.016*\"chamber\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.015*\"open\" + 0.013*\"tiepolo\"\n", + "2019-01-31 00:46:23,269 : INFO : topic diff=0.005534, rho=0.033634\n", + "2019-01-31 00:46:23,424 
: INFO : PROGRESS: pass 0, at document #1770000/4922894\n", + "2019-01-31 00:46:24,810 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:25,076 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\" + 0.009*\"dai\"\n", + "2019-01-31 00:46:25,077 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:46:25,078 : INFO : topic #34 (0.020): 0.076*\"start\" + 0.032*\"unionist\" + 0.030*\"american\" + 0.028*\"cotton\" + 0.028*\"new\" + 0.017*\"year\" + 0.015*\"california\" + 0.012*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:46:25,079 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:46:25,081 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:46:25,086 : INFO : topic diff=0.004971, rho=0.033615\n", + "2019-01-31 00:46:25,240 : INFO : PROGRESS: pass 0, at document #1772000/4922894\n", + "2019-01-31 00:46:26,590 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:26,856 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.022*\"personifi\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.016*\"unfortun\" + 0.013*\"malaysia\"\n", + "2019-01-31 00:46:26,857 : INFO : topic #36 (0.020): 
0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.007*\"uruguayan\" + 0.007*\"softwar\" + 0.007*\"championship\" + 0.007*\"includ\"\n", + "2019-01-31 00:46:26,858 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:46:26,859 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.027*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.023*\"england\" + 0.018*\"british\" + 0.018*\"youth\" + 0.016*\"ireland\" + 0.014*\"wale\"\n", + "2019-01-31 00:46:26,860 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"battalion\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"teufel\" + 0.006*\"pour\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:46:26,866 : INFO : topic diff=0.005021, rho=0.033596\n", + "2019-01-31 00:46:27,032 : INFO : PROGRESS: pass 0, at document #1774000/4922894\n", + "2019-01-31 00:46:28,446 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:28,716 : INFO : topic #34 (0.020): 0.075*\"start\" + 0.032*\"unionist\" + 0.030*\"american\" + 0.028*\"new\" + 0.028*\"cotton\" + 0.017*\"year\" + 0.015*\"california\" + 0.012*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:46:28,717 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:46:28,718 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"encyclopedia\" + 0.007*\"develop\"\n", + "2019-01-31 00:46:28,719 : INFO 
: topic #0 (0.020): 0.068*\"statewid\" + 0.041*\"line\" + 0.036*\"arsen\" + 0.035*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.014*\"exhaust\" + 0.013*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:46:28,721 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:46:28,727 : INFO : topic diff=0.007867, rho=0.033577\n", + "2019-01-31 00:46:28,878 : INFO : PROGRESS: pass 0, at document #1776000/4922894\n", + "2019-01-31 00:46:30,233 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:30,500 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:46:30,501 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:46:30,502 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.024*\"poison\" + 0.023*\"reprint\" + 0.022*\"personifi\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.013*\"malaysia\"\n", + "2019-01-31 00:46:30,503 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.027*\"australia\" + 0.027*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.023*\"england\" + 0.018*\"british\" + 0.017*\"youth\" + 0.016*\"ireland\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:46:30,504 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" 
+ 0.006*\"uruguayan\"\n", + "2019-01-31 00:46:30,509 : INFO : topic diff=0.005425, rho=0.033558\n", + "2019-01-31 00:46:30,668 : INFO : PROGRESS: pass 0, at document #1778000/4922894\n", + "2019-01-31 00:46:32,056 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:32,323 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.034*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:46:32,324 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:46:32,325 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.031*\"cotton\" + 0.028*\"area\" + 0.023*\"regim\" + 0.023*\"multitud\" + 0.022*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 00:46:32,326 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.023*\"epiru\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.014*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:46:32,327 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"carlo\" + 0.012*\"francisco\" + 0.012*\"santa\" + 0.012*\"lizard\" + 0.011*\"juan\"\n", + "2019-01-31 00:46:32,333 : INFO : topic diff=0.004494, rho=0.033539\n", + "2019-01-31 00:46:34,990 : INFO : -11.606 per-word bound, 3117.2 perplexity estimate based on a held-out corpus of 2000 documents with 529091 words\n", + "2019-01-31 00:46:34,990 : INFO : PROGRESS: pass 0, at document #1780000/4922894\n", + "2019-01-31 00:46:36,360 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:36,626 : INFO : topic #42 (0.020): 
0.046*\"german\" + 0.031*\"germani\" + 0.015*\"jewish\" + 0.014*\"vol\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.012*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.008*\"austria\"\n", + "2019-01-31 00:46:36,627 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:46:36,629 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:46:36,630 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.024*\"poison\" + 0.023*\"reprint\" + 0.022*\"personifi\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.016*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:46:36,631 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\" + 0.009*\"year\"\n", + "2019-01-31 00:46:36,637 : INFO : topic diff=0.005593, rho=0.033520\n", + "2019-01-31 00:46:36,792 : INFO : PROGRESS: pass 0, at document #1782000/4922894\n", + "2019-01-31 00:46:38,183 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:38,449 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.009*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"comic\" + 0.006*\"blue\" + 0.005*\"anim\" + 0.005*\"vision\"\n", + "2019-01-31 00:46:38,450 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 00:46:38,451 : INFO : topic #18 (0.020): 
0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:46:38,452 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:46:38,453 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.020*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:46:38,459 : INFO : topic diff=0.004811, rho=0.033501\n", + "2019-01-31 00:46:38,615 : INFO : PROGRESS: pass 0, at document #1784000/4922894\n", + "2019-01-31 00:46:40,013 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:40,280 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.041*\"line\" + 0.037*\"arsen\" + 0.034*\"raid\" + 0.028*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.013*\"pain\" + 0.013*\"oper\"\n", + "2019-01-31 00:46:40,281 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"jewish\" + 0.014*\"vol\" + 0.014*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:46:40,282 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:46:40,283 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:46:40,284 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 
0.022*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:46:40,290 : INFO : topic diff=0.004400, rho=0.033482\n", + "2019-01-31 00:46:40,450 : INFO : PROGRESS: pass 0, at document #1786000/4922894\n", + "2019-01-31 00:46:41,861 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:42,127 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.030*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 00:46:42,128 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:46:42,129 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.016*\"princ\" + 0.014*\"brazil\" + 0.013*\"count\"\n", + "2019-01-31 00:46:42,131 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 00:46:42,132 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.012*\"carlo\" + 0.012*\"lizard\" + 0.012*\"santa\" + 0.011*\"juan\"\n", + "2019-01-31 00:46:42,139 : INFO : topic diff=0.005170, rho=0.033464\n", + "2019-01-31 00:46:42,298 : INFO : PROGRESS: pass 0, at document #1788000/4922894\n", + "2019-01-31 00:46:43,705 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:43,971 : INFO : topic #13 (0.020): 
0.028*\"sourc\" + 0.027*\"australia\" + 0.027*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"youth\" + 0.016*\"ireland\" + 0.014*\"wale\"\n", + "2019-01-31 00:46:43,972 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"user\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"cytokin\" + 0.008*\"uruguayan\" + 0.007*\"championship\" + 0.007*\"brio\"\n", + "2019-01-31 00:46:43,973 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.006*\"differ\"\n", + "2019-01-31 00:46:43,974 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:46:43,976 : INFO : topic #34 (0.020): 0.073*\"start\" + 0.032*\"unionist\" + 0.030*\"cotton\" + 0.029*\"american\" + 0.028*\"new\" + 0.017*\"year\" + 0.016*\"california\" + 0.013*\"terri\" + 0.012*\"warrior\" + 0.011*\"north\"\n", + "2019-01-31 00:46:43,981 : INFO : topic diff=0.004782, rho=0.033445\n", + "2019-01-31 00:46:44,193 : INFO : PROGRESS: pass 0, at document #1790000/4922894\n", + "2019-01-31 00:46:45,597 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:45,863 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:46:45,864 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 
0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:46:45,865 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"damag\" + 0.015*\"swedish\" + 0.015*\"sweden\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"farid\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:46:45,866 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.021*\"dutch\" + 0.019*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:46:45,867 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:46:45,873 : INFO : topic diff=0.005301, rho=0.033426\n", + "2019-01-31 00:46:46,033 : INFO : PROGRESS: pass 0, at document #1792000/4922894\n", + "2019-01-31 00:46:47,447 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:47,714 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.027*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.020*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:46:47,715 : INFO : topic #46 (0.020): 0.021*\"stop\" + 0.017*\"damag\" + 0.016*\"swedish\" + 0.015*\"sweden\" + 0.015*\"wind\" + 0.014*\"norwai\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"farid\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:46:47,716 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:46:47,717 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 
0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:46:47,718 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.015*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:46:47,725 : INFO : topic diff=0.005355, rho=0.033408\n", + "2019-01-31 00:46:47,884 : INFO : PROGRESS: pass 0, at document #1794000/4922894\n", + "2019-01-31 00:46:49,277 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:49,544 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:46:49,545 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:46:49,546 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.006*\"teufel\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 00:46:49,547 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.044*\"chilton\" + 0.028*\"hong\" + 0.027*\"kong\" + 0.023*\"korea\" + 0.019*\"korean\" + 0.017*\"han\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 00:46:49,548 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.019*\"adulthood\" + 0.017*\"male\" + 0.016*\"feel\" + 0.012*\"plaisir\" + 0.011*\"hostil\" + 0.011*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:46:49,554 : INFO : topic diff=0.004802, rho=0.033389\n", + "2019-01-31 00:46:49,712 : INFO : PROGRESS: pass 0, at document #1796000/4922894\n", + "2019-01-31 00:46:51,071 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:51,340 : INFO : topic #48 (0.020): 0.081*\"octob\" + 0.079*\"sens\" + 0.077*\"march\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.068*\"april\" + 0.067*\"juli\" + 0.066*\"judici\" + 0.066*\"august\" + 0.064*\"decatur\"\n", + "2019-01-31 00:46:51,341 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.009*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:46:51,342 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"differ\"\n", + "2019-01-31 00:46:51,343 : INFO : topic #45 (0.020): 0.024*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"black\" + 0.016*\"illicit\" + 0.016*\"colder\" + 0.016*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"depress\" + 0.008*\"light\"\n", + "2019-01-31 00:46:51,344 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.024*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:46:51,350 : INFO : topic diff=0.004914, rho=0.033370\n", + "2019-01-31 00:46:51,508 : INFO : PROGRESS: pass 0, at document #1798000/4922894\n", + "2019-01-31 00:46:52,890 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:53,158 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:46:53,159 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" 
+ 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:46:53,161 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.013*\"selma\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:46:53,162 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:46:53,163 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:46:53,169 : INFO : topic diff=0.004914, rho=0.033352\n", + "2019-01-31 00:46:55,851 : INFO : -11.595 per-word bound, 3093.0 perplexity estimate based on a held-out corpus of 2000 documents with 549658 words\n", + "2019-01-31 00:46:55,851 : INFO : PROGRESS: pass 0, at document #1800000/4922894\n", + "2019-01-31 00:46:57,226 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:57,492 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"taxpay\" + 0.020*\"candid\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.010*\"théori\" + 0.010*\"champion\"\n", + "2019-01-31 00:46:57,494 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:46:57,495 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:46:57,496 : INFO : topic 
#20 (0.020): 0.143*\"scholar\" + 0.038*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:46:57,498 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.009*\"battalion\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\" + 0.006*\"teufel\"\n", + "2019-01-31 00:46:57,503 : INFO : topic diff=0.005013, rho=0.033333\n", + "2019-01-31 00:46:57,667 : INFO : PROGRESS: pass 0, at document #1802000/4922894\n", + "2019-01-31 00:46:59,089 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:46:59,355 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.013*\"selma\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 00:46:59,356 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.031*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:46:59,357 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:46:59,359 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"magazin\"\n", + "2019-01-31 00:46:59,360 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.026*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.016*\"chamber\" + 0.015*\"taxpay\" + 0.015*\"open\" + 0.015*\"martin\" + 
0.014*\"tiepolo\"\n", + "2019-01-31 00:46:59,366 : INFO : topic diff=0.005522, rho=0.033315\n", + "2019-01-31 00:46:59,525 : INFO : PROGRESS: pass 0, at document #1804000/4922894\n", + "2019-01-31 00:47:00,937 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:01,203 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.043*\"chilton\" + 0.028*\"hong\" + 0.028*\"kong\" + 0.023*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.015*\"han\" + 0.015*\"sourc\" + 0.013*\"kim\"\n", + "2019-01-31 00:47:01,205 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.007*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 00:47:01,206 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:47:01,207 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.019*\"adulthood\" + 0.017*\"male\" + 0.016*\"feel\" + 0.012*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:47:01,208 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.035*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.011*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:47:01,214 : INFO : topic diff=0.005859, rho=0.033296\n", + "2019-01-31 00:47:01,374 : INFO : PROGRESS: pass 0, at document #1806000/4922894\n", + "2019-01-31 00:47:02,767 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:03,033 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"nicola\" + 
0.011*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:47:03,034 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.044*\"vigour\" + 0.043*\"popolo\" + 0.038*\"tortur\" + 0.031*\"cotton\" + 0.028*\"area\" + 0.023*\"regim\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:47:03,036 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:47:03,037 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:47:03,038 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.010*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:47:03,044 : INFO : topic diff=0.004806, rho=0.033278\n", + "2019-01-31 00:47:03,202 : INFO : PROGRESS: pass 0, at document #1808000/4922894\n", + "2019-01-31 00:47:04,594 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:04,860 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:47:04,861 : INFO : topic #0 (0.020): 0.069*\"statewid\" + 0.041*\"line\" + 0.035*\"raid\" + 0.035*\"arsen\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.013*\"pain\" + 0.012*\"oper\"\n", + "2019-01-31 00:47:04,862 : INFO : topic #29 (0.020): 0.027*\"companhia\" + 0.011*\"million\" + 0.011*\"busi\" + 0.010*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 
0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:47:04,864 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.049*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:47:04,865 : INFO : topic #13 (0.020): 0.029*\"sourc\" + 0.027*\"australia\" + 0.027*\"london\" + 0.026*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:47:04,871 : INFO : topic diff=0.004991, rho=0.033260\n", + "2019-01-31 00:47:05,029 : INFO : PROGRESS: pass 0, at document #1810000/4922894\n", + "2019-01-31 00:47:06,420 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:06,687 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:47:06,688 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.027*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.020*\"rainfal\" + 0.019*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:47:06,689 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"selma\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:47:06,690 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.009*\"sri\" + 0.009*\"khalsa\"\n", + "2019-01-31 00:47:06,691 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"southern\" + 
0.006*\"differ\"\n", + "2019-01-31 00:47:06,697 : INFO : topic diff=0.005036, rho=0.033241\n", + "2019-01-31 00:47:06,854 : INFO : PROGRESS: pass 0, at document #1812000/4922894\n", + "2019-01-31 00:47:08,257 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:08,524 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:47:08,525 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.016*\"swedish\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.016*\"sweden\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.011*\"farid\" + 0.010*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 00:47:08,526 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:47:08,527 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:47:08,528 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.021*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:47:08,534 : INFO : topic diff=0.005147, rho=0.033223\n", + "2019-01-31 00:47:08,695 : INFO : PROGRESS: pass 0, at document #1814000/4922894\n", + "2019-01-31 00:47:10,105 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:10,371 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.043*\"vigour\" + 0.043*\"popolo\" + 0.037*\"tortur\" + 
0.033*\"area\" + 0.031*\"cotton\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:47:10,373 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.013*\"selma\" + 0.013*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 00:47:10,374 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"tajikistan\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 00:47:10,375 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.008*\"septemb\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.005*\"blue\" + 0.005*\"anim\" + 0.005*\"vision\"\n", + "2019-01-31 00:47:10,376 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:47:10,382 : INFO : topic diff=0.005381, rho=0.033204\n", + "2019-01-31 00:47:10,538 : INFO : PROGRESS: pass 0, at document #1816000/4922894\n", + "2019-01-31 00:47:11,920 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:12,186 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.021*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:47:12,188 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.030*\"american\" + 0.029*\"cotton\" + 0.028*\"new\" + 0.017*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:47:12,189 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.008*\"septemb\" + 
0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.006*\"blue\" + 0.005*\"anim\" + 0.005*\"vision\"\n", + "2019-01-31 00:47:12,190 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.043*\"vigour\" + 0.043*\"popolo\" + 0.037*\"tortur\" + 0.033*\"area\" + 0.031*\"cotton\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.019*\"commun\"\n", + "2019-01-31 00:47:12,192 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:47:12,197 : INFO : topic diff=0.005346, rho=0.033186\n", + "2019-01-31 00:47:12,358 : INFO : PROGRESS: pass 0, at document #1818000/4922894\n", + "2019-01-31 00:47:13,755 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:14,022 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.014*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:47:14,023 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"black\" + 0.016*\"western\" + 0.015*\"colder\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:47:14,024 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:47:14,025 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:47:14,027 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.024*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 
0.015*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.008*\"cathedr\"\n", + "2019-01-31 00:47:14,033 : INFO : topic diff=0.005262, rho=0.033168\n", + "2019-01-31 00:47:16,646 : INFO : -11.641 per-word bound, 3193.3 perplexity estimate based on a held-out corpus of 2000 documents with 503774 words\n", + "2019-01-31 00:47:16,647 : INFO : PROGRESS: pass 0, at document #1820000/4922894\n", + "2019-01-31 00:47:18,014 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:18,281 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"gener\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"differ\" + 0.006*\"servitud\" + 0.006*\"southern\"\n", + "2019-01-31 00:47:18,282 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.011*\"centuri\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.008*\"cathedr\"\n", + "2019-01-31 00:47:18,283 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:47:18,284 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.025*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.018*\"republ\" + 0.016*\"polici\" + 0.013*\"selma\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:47:18,285 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.023*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"black\" + 0.016*\"western\" + 0.015*\"colder\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"depress\" + 0.008*\"light\"\n", + "2019-01-31 00:47:18,291 : INFO : topic diff=0.006148, rho=0.033150\n", + "2019-01-31 00:47:18,445 : INFO : PROGRESS: pass 0, at document #1822000/4922894\n", + "2019-01-31 00:47:19,810 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:20,076 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.016*\"sweden\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.011*\"farid\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 00:47:20,077 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.021*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 00:47:20,079 : INFO : topic #39 (0.020): 0.055*\"canada\" + 0.041*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 0.014*\"new\" + 0.012*\"quebec\"\n", + "2019-01-31 00:47:20,080 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:47:20,081 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.025*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.018*\"tiepolo\" + 0.016*\"chamber\" + 0.015*\"taxpay\" + 0.014*\"open\" + 0.014*\"martin\"\n", + "2019-01-31 00:47:20,087 : INFO : topic diff=0.005931, rho=0.033131\n", + "2019-01-31 00:47:20,307 : INFO : PROGRESS: pass 0, at document #1824000/4922894\n", + "2019-01-31 00:47:21,732 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:21,998 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"pour\" + 0.006*\"govern\" + 0.006*\"teufel\"\n", + "2019-01-31 00:47:21,999 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.044*\"vigour\" + 0.043*\"popolo\" + 0.037*\"tortur\" + 0.032*\"area\" + 0.030*\"cotton\" + 
0.023*\"regim\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:47:22,001 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.021*\"del\" + 0.017*\"mexico\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 00:47:22,002 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:47:22,003 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:47:22,009 : INFO : topic diff=0.005446, rho=0.033113\n", + "2019-01-31 00:47:22,173 : INFO : PROGRESS: pass 0, at document #1826000/4922894\n", + "2019-01-31 00:47:23,592 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:23,859 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.023*\"noll\" + 0.021*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:47:23,860 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.022*\"taxpay\" + 0.020*\"candid\" + 0.015*\"ret\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.010*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 00:47:23,861 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.041*\"line\" + 0.036*\"arsen\" + 0.036*\"raid\" + 0.029*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"exhaust\" + 0.014*\"pain\" + 0.012*\"oper\"\n", + "2019-01-31 00:47:23,862 : INFO : topic #13 (0.020): 0.029*\"sourc\" + 0.027*\"australia\" + 0.027*\"london\" + 
0.026*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:47:23,863 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:47:23,869 : INFO : topic diff=0.005925, rho=0.033095\n", + "2019-01-31 00:47:24,033 : INFO : PROGRESS: pass 0, at document #1828000/4922894\n", + "2019-01-31 00:47:25,411 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:25,678 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.024*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.016*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:47:25,679 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.023*\"palmer\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\" + 0.009*\"dai\"\n", + "2019-01-31 00:47:25,680 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"taxpay\" + 0.020*\"candid\" + 0.017*\"ret\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"tornado\" + 0.010*\"théori\" + 0.010*\"squatter\"\n", + "2019-01-31 00:47:25,682 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:47:25,683 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.032*\"priest\" + 0.021*\"quarterli\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.016*\"grammat\" + 0.014*\"princ\" + 0.013*\"brazil\" + 0.013*\"maria\"\n", + "2019-01-31 00:47:25,689 : INFO : topic diff=0.004206, rho=0.033077\n", + "2019-01-31 00:47:25,844 : INFO : 
PROGRESS: pass 0, at document #1830000/4922894\n", + "2019-01-31 00:47:27,224 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:27,491 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.009*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:47:27,492 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"teufel\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:47:27,493 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.035*\"perceptu\" + 0.019*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:47:27,494 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.026*\"factor\" + 0.020*\"adulthood\" + 0.016*\"feel\" + 0.016*\"male\" + 0.012*\"hostil\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:47:27,495 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.028*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.016*\"california\" + 0.013*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:47:27,501 : INFO : topic diff=0.004956, rho=0.033059\n", + "2019-01-31 00:47:27,655 : INFO : PROGRESS: pass 0, at document #1832000/4922894\n", + "2019-01-31 00:47:29,025 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:29,292 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:47:29,293 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"taxpay\" + 
0.020*\"candid\" + 0.017*\"ret\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"tornado\" + 0.010*\"théori\" + 0.010*\"squatter\"\n", + "2019-01-31 00:47:29,294 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.006*\"blue\" + 0.005*\"anim\" + 0.005*\"admit\"\n", + "2019-01-31 00:47:29,295 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"septemb\" + 0.024*\"epiru\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:47:29,296 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.027*\"woman\" + 0.027*\"champion\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:47:29,302 : INFO : topic diff=0.004822, rho=0.033041\n", + "2019-01-31 00:47:29,467 : INFO : PROGRESS: pass 0, at document #1834000/4922894\n", + "2019-01-31 00:47:30,880 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:31,147 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.015*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.011*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:47:31,148 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.027*\"woman\" + 0.027*\"champion\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:47:31,149 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:47:31,150 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.044*\"vigour\" + 0.043*\"popolo\" + 
0.038*\"tortur\" + 0.031*\"area\" + 0.030*\"cotton\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:47:31,151 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"taxpay\" + 0.020*\"candid\" + 0.017*\"ret\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"théori\" + 0.010*\"tornado\" + 0.010*\"squatter\"\n", + "2019-01-31 00:47:31,157 : INFO : topic diff=0.005927, rho=0.033023\n", + "2019-01-31 00:47:31,312 : INFO : PROGRESS: pass 0, at document #1836000/4922894\n", + "2019-01-31 00:47:32,703 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:32,969 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:47:32,970 : INFO : topic #42 (0.020): 0.044*\"german\" + 0.031*\"germani\" + 0.016*\"israel\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.012*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.008*\"austria\"\n", + "2019-01-31 00:47:32,971 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.015*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.011*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:47:32,973 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:47:32,974 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"taxpay\" + 0.020*\"candid\" + 0.017*\"ret\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"théori\" + 0.010*\"tornado\" + 0.010*\"squatter\"\n", + "2019-01-31 00:47:32,979 : INFO : topic diff=0.005192, rho=0.033005\n", + "2019-01-31 00:47:33,137 : INFO : PROGRESS: pass 0, at 
document #1838000/4922894\n", + "2019-01-31 00:47:34,535 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:47:34,801 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:47:34,802 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:47:34,804 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.010*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:47:34,805 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:47:34,806 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.028*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.016*\"california\" + 0.013*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:47:34,812 : INFO : topic diff=0.005188, rho=0.032987\n", + "2019-01-31 00:47:37,592 : INFO : -11.878 per-word bound, 3762.7 perplexity estimate based on a held-out corpus of 2000 documents with 595170 words\n", + "2019-01-31 00:47:37,592 : INFO : PROGRESS: pass 0, at document #1840000/4922894\n", + "2019-01-31 00:47:39,017 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:39,284 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 
0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"human\"\n", + "2019-01-31 00:47:39,285 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.025*\"factor\" + 0.019*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:47:39,286 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:47:39,287 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.012*\"carlo\" + 0.012*\"juan\" + 0.011*\"lizard\"\n", + "2019-01-31 00:47:39,288 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:47:39,294 : INFO : topic diff=0.005160, rho=0.032969\n", + "2019-01-31 00:47:39,450 : INFO : PROGRESS: pass 0, at document #1842000/4922894\n", + "2019-01-31 00:47:40,820 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:41,087 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.017*\"black\" + 0.017*\"illicit\" + 0.016*\"western\" + 0.016*\"colder\" + 0.013*\"record\" + 0.011*\"blind\" + 0.007*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:47:41,088 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.012*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:47:41,089 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" 
+ 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:47:41,090 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.025*\"factor\" + 0.019*\"adulthood\" + 0.016*\"feel\" + 0.015*\"male\" + 0.012*\"plaisir\" + 0.012*\"hostil\" + 0.010*\"genu\" + 0.008*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:47:41,091 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:47:41,097 : INFO : topic diff=0.005418, rho=0.032951\n", + "2019-01-31 00:47:41,253 : INFO : PROGRESS: pass 0, at document #1844000/4922894\n", + "2019-01-31 00:47:42,636 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:42,902 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"taxpay\" + 0.020*\"candid\" + 0.017*\"ret\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"tornado\" + 0.010*\"théori\" + 0.009*\"squatter\"\n", + "2019-01-31 00:47:42,903 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"gener\" + 0.007*\"frontal\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"differ\" + 0.006*\"method\"\n", + "2019-01-31 00:47:42,904 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.043*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.031*\"area\" + 0.030*\"cotton\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:47:42,905 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.020*\"member\" + 0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.014*\"selma\"\n", + "2019-01-31 00:47:42,906 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.040*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 
0.024*\"reprint\" + 0.023*\"moscow\" + 0.018*\"poland\" + 0.017*\"unfortun\" + 0.013*\"turin\"\n", + "2019-01-31 00:47:42,912 : INFO : topic diff=0.004468, rho=0.032933\n", + "2019-01-31 00:47:43,071 : INFO : PROGRESS: pass 0, at document #1846000/4922894\n", + "2019-01-31 00:47:44,470 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:44,736 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 00:47:44,737 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:47:44,738 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.011*\"televis\" + 0.010*\"sri\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 00:47:44,739 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.028*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:47:44,740 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.044*\"chilton\" + 0.027*\"hong\" + 0.026*\"kong\" + 0.024*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:47:44,746 : INFO : topic diff=0.004114, rho=0.032915\n", + "2019-01-31 00:47:44,904 : INFO : PROGRESS: pass 0, at document #1848000/4922894\n", + "2019-01-31 00:47:46,295 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:46,561 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.029*\"new\" + 
0.027*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.012*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:47:46,562 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.024*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:47:46,563 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:47:46,564 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.018*\"wind\" + 0.017*\"swedish\" + 0.017*\"sweden\" + 0.016*\"damag\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.012*\"farid\" + 0.011*\"denmark\" + 0.010*\"danish\"\n", + "2019-01-31 00:47:46,565 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:47:46,571 : INFO : topic diff=0.005729, rho=0.032898\n", + "2019-01-31 00:47:46,730 : INFO : PROGRESS: pass 0, at document #1850000/4922894\n", + "2019-01-31 00:47:48,133 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:48,399 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.008*\"foam\" + 0.008*\"land\" + 0.008*\"lobe\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:47:48,401 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.049*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:47:48,402 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.024*\"septemb\" 
+ 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:47:48,403 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.040*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:47:48,404 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.010*\"sri\" + 0.010*\"muskoge\" + 0.010*\"alam\"\n", + "2019-01-31 00:47:48,410 : INFO : topic diff=0.005411, rho=0.032880\n", + "2019-01-31 00:47:48,565 : INFO : PROGRESS: pass 0, at document #1852000/4922894\n", + "2019-01-31 00:47:49,945 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:50,212 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.040*\"tortur\" + 0.031*\"area\" + 0.029*\"cotton\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:47:50,213 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"report\" + 0.013*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:47:50,214 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.040*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:47:50,215 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.036*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:47:50,216 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 
0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:47:50,222 : INFO : topic diff=0.004384, rho=0.032862\n", + "2019-01-31 00:47:50,435 : INFO : PROGRESS: pass 0, at document #1854000/4922894\n", + "2019-01-31 00:47:51,806 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:52,072 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"collector\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:47:52,073 : INFO : topic #31 (0.020): 0.057*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"player\" + 0.025*\"taxpay\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:47:52,074 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.007*\"candid\" + 0.006*\"develop\"\n", + "2019-01-31 00:47:52,076 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"govern\" + 0.022*\"nation\" + 0.021*\"member\" + 0.018*\"gener\" + 0.016*\"start\" + 0.016*\"seri\" + 0.016*\"serv\"\n", + "2019-01-31 00:47:52,077 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:47:52,083 : INFO : topic diff=0.005173, rho=0.032844\n", + "2019-01-31 00:47:52,240 : INFO : PROGRESS: pass 0, at document #1856000/4922894\n", + "2019-01-31 00:47:53,648 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:53,914 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" 
+ 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:47:53,915 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:47:53,916 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.015*\"soviet\" + 0.012*\"santa\" + 0.012*\"francisco\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"lizard\"\n", + "2019-01-31 00:47:53,917 : INFO : topic #39 (0.020): 0.054*\"canada\" + 0.041*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.014*\"new\" + 0.011*\"quebec\"\n", + "2019-01-31 00:47:53,918 : INFO : topic #46 (0.020): 0.019*\"wind\" + 0.018*\"stop\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.016*\"damag\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.012*\"farid\" + 0.010*\"denmark\" + 0.010*\"huntsvil\"\n", + "2019-01-31 00:47:53,924 : INFO : topic diff=0.004294, rho=0.032827\n", + "2019-01-31 00:47:54,079 : INFO : PROGRESS: pass 0, at document #1858000/4922894\n", + "2019-01-31 00:47:55,457 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:47:55,723 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.049*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:47:55,724 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"tiepolo\" + 0.015*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.013*\"winner\"\n", + "2019-01-31 00:47:55,725 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 
0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:47:55,726 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:47:55,727 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:47:55,733 : INFO : topic diff=0.004720, rho=0.032809\n", + "2019-01-31 00:47:58,376 : INFO : -11.625 per-word bound, 3157.6 perplexity estimate based on a held-out corpus of 2000 documents with 524554 words\n", + "2019-01-31 00:47:58,376 : INFO : PROGRESS: pass 0, at document #1860000/4922894\n", + "2019-01-31 00:47:59,743 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:00,009 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"noll\" + 0.022*\"japanes\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:48:00,010 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"candid\" + 0.021*\"taxpay\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.013*\"fool\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.010*\"théori\" + 0.009*\"squatter\"\n", + "2019-01-31 00:48:00,011 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:48:00,012 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.032*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.013*\"maria\" + 
0.013*\"princ\" + 0.012*\"brazil\"\n", + "2019-01-31 00:48:00,013 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.029*\"american\" + 0.029*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:48:00,019 : INFO : topic diff=0.004762, rho=0.032791\n", + "2019-01-31 00:48:00,179 : INFO : PROGRESS: pass 0, at document #1862000/4922894\n", + "2019-01-31 00:48:01,586 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:01,853 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"gener\" + 0.007*\"frontal\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 00:48:01,854 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:48:01,855 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:48:01,856 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.043*\"chilton\" + 0.027*\"hong\" + 0.026*\"kong\" + 0.023*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:48:01,857 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.040*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:48:01,863 : INFO : topic diff=0.004694, rho=0.032774\n", + "2019-01-31 00:48:02,023 : INFO : PROGRESS: pass 0, at document 
#1864000/4922894\n", + "2019-01-31 00:48:03,440 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:03,707 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:48:03,708 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.040*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:48:03,709 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:48:03,710 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.008*\"love\" + 0.008*\"charact\" + 0.007*\"septemb\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.006*\"blue\" + 0.005*\"anim\" + 0.005*\"vision\"\n", + "2019-01-31 00:48:03,712 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:48:03,718 : INFO : topic diff=0.004585, rho=0.032756\n", + "2019-01-31 00:48:03,875 : INFO : PROGRESS: pass 0, at document #1866000/4922894\n", + "2019-01-31 00:48:05,241 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:05,510 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.014*\"report\"\n", + "2019-01-31 00:48:05,511 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 
0.021*\"govern\" + 0.021*\"member\" + 0.018*\"gener\" + 0.016*\"start\" + 0.016*\"seri\" + 0.016*\"serv\"\n", + "2019-01-31 00:48:05,512 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:48:05,514 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.023*\"palmer\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"highli\" + 0.009*\"dai\"\n", + "2019-01-31 00:48:05,515 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.027*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.009*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 00:48:05,520 : INFO : topic diff=0.005214, rho=0.032739\n", + "2019-01-31 00:48:05,678 : INFO : PROGRESS: pass 0, at document #1868000/4922894\n", + "2019-01-31 00:48:07,071 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:07,337 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.007*\"uruguayan\" + 0.007*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 00:48:07,339 : INFO : topic #48 (0.020): 0.082*\"octob\" + 0.080*\"march\" + 0.078*\"sens\" + 0.076*\"juli\" + 0.073*\"notion\" + 0.073*\"januari\" + 0.072*\"april\" + 0.071*\"judici\" + 0.071*\"august\" + 0.070*\"decatur\"\n", + "2019-01-31 00:48:07,340 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.028*\"hong\" + 0.027*\"kong\" + 0.023*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:48:07,341 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 
0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.014*\"selma\"\n", + "2019-01-31 00:48:07,342 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.014*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:48:07,348 : INFO : topic diff=0.004594, rho=0.032721\n", + "2019-01-31 00:48:07,510 : INFO : PROGRESS: pass 0, at document #1870000/4922894\n", + "2019-01-31 00:48:08,912 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:09,178 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:48:09,179 : INFO : topic #48 (0.020): 0.082*\"octob\" + 0.080*\"march\" + 0.078*\"sens\" + 0.075*\"juli\" + 0.074*\"januari\" + 0.073*\"notion\" + 0.073*\"april\" + 0.072*\"judici\" + 0.071*\"august\" + 0.070*\"decatur\"\n", + "2019-01-31 00:48:09,181 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.043*\"popolo\" + 0.043*\"vigour\" + 0.040*\"tortur\" + 0.030*\"area\" + 0.029*\"cotton\" + 0.023*\"regim\" + 0.022*\"multitud\" + 0.022*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:48:09,182 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:48:09,183 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.018*\"wind\" + 0.017*\"swedish\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.014*\"norwegian\" + 0.013*\"denmark\" + 0.012*\"farid\" + 0.011*\"danish\"\n", + "2019-01-31 00:48:09,188 : INFO : topic diff=0.005372, rho=0.032703\n", + "2019-01-31 00:48:09,343 : INFO : PROGRESS: pass 0, at document #1872000/4922894\n", + "2019-01-31 
00:48:10,720 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:10,986 : INFO : topic #39 (0.020): 0.052*\"canada\" + 0.041*\"canadian\" + 0.030*\"ontario\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 00:48:10,987 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"tiepolo\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 00:48:10,988 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"anglo\" + 0.012*\"pakistan\" + 0.012*\"islam\" + 0.011*\"televis\" + 0.010*\"alam\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\"\n", + "2019-01-31 00:48:10,989 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.021*\"member\" + 0.018*\"gener\" + 0.016*\"start\" + 0.016*\"serv\" + 0.016*\"seri\"\n", + "2019-01-31 00:48:10,990 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:48:10,996 : INFO : topic diff=0.004824, rho=0.032686\n", + "2019-01-31 00:48:11,156 : INFO : PROGRESS: pass 0, at document #1874000/4922894\n", + "2019-01-31 00:48:12,572 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:12,838 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.021*\"member\" + 0.018*\"gener\" + 0.016*\"start\" + 0.016*\"serv\" + 0.016*\"seri\"\n", + "2019-01-31 00:48:12,840 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 
0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:48:12,841 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.032*\"personifi\" + 0.028*\"poison\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:48:12,842 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.016*\"vol\" + 0.016*\"israel\" + 0.015*\"jewish\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:48:12,843 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:48:12,849 : INFO : topic diff=0.004910, rho=0.032669\n", + "2019-01-31 00:48:13,006 : INFO : PROGRESS: pass 0, at document #1876000/4922894\n", + "2019-01-31 00:48:14,399 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:14,666 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.027*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"start\" + 0.009*\"gothic\"\n", + "2019-01-31 00:48:14,667 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"gener\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"method\"\n", + "2019-01-31 00:48:14,668 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:48:14,669 : INFO : topic #34 (0.020): 0.072*\"start\" + 
0.031*\"unionist\" + 0.029*\"american\" + 0.029*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:48:14,670 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.035*\"arsen\" + 0.033*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"pain\" + 0.013*\"exhaust\" + 0.013*\"oper\"\n", + "2019-01-31 00:48:14,676 : INFO : topic diff=0.004562, rho=0.032651\n", + "2019-01-31 00:48:14,836 : INFO : PROGRESS: pass 0, at document #1878000/4922894\n", + "2019-01-31 00:48:16,231 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:16,497 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.036*\"perceptu\" + 0.022*\"theater\" + 0.019*\"damn\" + 0.019*\"place\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 00:48:16,498 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:48:16,500 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"vacant\"\n", + "2019-01-31 00:48:16,501 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:48:16,502 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:48:16,507 : INFO : topic diff=0.005380, rho=0.032634\n", + "2019-01-31 
00:48:19,080 : INFO : -11.425 per-word bound, 2750.4 perplexity estimate based on a held-out corpus of 2000 documents with 504946 words\n", + "2019-01-31 00:48:19,081 : INFO : PROGRESS: pass 0, at document #1880000/4922894\n", + "2019-01-31 00:48:20,424 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:20,689 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.029*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:48:20,691 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.024*\"christian\" + 0.022*\"cathol\" + 0.022*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:48:20,692 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.042*\"chilton\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.012*\"shirin\" + 0.012*\"kim\"\n", + "2019-01-31 00:48:20,693 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:48:20,694 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"help\"\n", + "2019-01-31 00:48:20,700 : INFO : topic diff=0.005206, rho=0.032616\n", + "2019-01-31 00:48:20,854 : INFO : PROGRESS: pass 0, at document #1882000/4922894\n", + "2019-01-31 00:48:22,245 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:22,511 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 
0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:48:22,512 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:48:22,513 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"player\" + 0.025*\"taxpay\" + 0.020*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.008*\"reconstruct\"\n", + "2019-01-31 00:48:22,515 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:48:22,516 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.014*\"male\" + 0.012*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:48:22,521 : INFO : topic diff=0.005047, rho=0.032599\n", + "2019-01-31 00:48:22,680 : INFO : PROGRESS: pass 0, at document #1884000/4922894\n", + "2019-01-31 00:48:24,080 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:24,346 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.022*\"candid\" + 0.020*\"taxpay\" + 0.014*\"ret\" + 0.014*\"driver\" + 0.011*\"find\" + 0.011*\"fool\" + 0.010*\"théori\" + 0.010*\"tornado\" + 0.010*\"landslid\"\n", + "2019-01-31 00:48:24,348 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.035*\"perceptu\" + 0.022*\"theater\" + 0.018*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:48:24,349 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"militari\" + 0.014*\"oper\" 
+ 0.014*\"unionist\" + 0.012*\"airmen\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:48:24,350 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"candid\" + 0.007*\"uruguayan\" + 0.007*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 00:48:24,351 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.031*\"personifi\" + 0.028*\"poison\" + 0.026*\"reprint\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:48:24,357 : INFO : topic diff=0.006740, rho=0.032582\n", + "2019-01-31 00:48:24,574 : INFO : PROGRESS: pass 0, at document #1886000/4922894\n", + "2019-01-31 00:48:25,990 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:26,256 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.041*\"line\" + 0.034*\"arsen\" + 0.033*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.017*\"pain\" + 0.013*\"oper\" + 0.013*\"exhaust\"\n", + "2019-01-31 00:48:26,257 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 00:48:26,258 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.041*\"american\" + 0.029*\"valour\" + 0.023*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"netherland\"\n", + "2019-01-31 00:48:26,259 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:48:26,260 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.021*\"candid\" + 0.021*\"taxpay\" + 
0.014*\"ret\" + 0.014*\"driver\" + 0.011*\"find\" + 0.011*\"fool\" + 0.010*\"théori\" + 0.010*\"tornado\" + 0.010*\"squatter\"\n", + "2019-01-31 00:48:26,266 : INFO : topic diff=0.006519, rho=0.032564\n", + "2019-01-31 00:48:26,425 : INFO : PROGRESS: pass 0, at document #1888000/4922894\n", + "2019-01-31 00:48:27,833 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:28,100 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.015*\"ret\" + 0.014*\"driver\" + 0.011*\"find\" + 0.011*\"fool\" + 0.010*\"théori\" + 0.010*\"squatter\" + 0.010*\"tornado\"\n", + "2019-01-31 00:48:28,101 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:48:28,102 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.008*\"love\" + 0.008*\"charact\" + 0.008*\"septemb\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.005*\"anim\" + 0.005*\"blue\" + 0.005*\"workplac\"\n", + "2019-01-31 00:48:28,103 : INFO : topic #39 (0.020): 0.055*\"canada\" + 0.041*\"canadian\" + 0.028*\"ontario\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 00:48:28,104 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.027*\"australia\" + 0.026*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:48:28,110 : INFO : topic diff=0.004895, rho=0.032547\n", + "2019-01-31 00:48:28,272 : INFO : PROGRESS: pass 0, at document #1890000/4922894\n", + "2019-01-31 00:48:29,697 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:29,962 : INFO : topic #36 (0.020): 0.011*\"network\" + 
0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 00:48:29,964 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:48:29,965 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"hostil\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"live\" + 0.008*\"biom\"\n", + "2019-01-31 00:48:29,966 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 00:48:29,966 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.027*\"australia\" + 0.026*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:48:29,972 : INFO : topic diff=0.005038, rho=0.032530\n", + "2019-01-31 00:48:30,132 : INFO : PROGRESS: pass 0, at document #1892000/4922894\n", + "2019-01-31 00:48:31,549 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:31,815 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 00:48:31,816 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.024*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:48:31,817 : INFO : topic #18 (0.020): 
0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"help\"\n", + "2019-01-31 00:48:31,818 : INFO : topic #46 (0.020): 0.021*\"stop\" + 0.017*\"wind\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.013*\"huntsvil\" + 0.012*\"denmark\" + 0.010*\"farid\"\n", + "2019-01-31 00:48:31,819 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.044*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.012*\"han\"\n", + "2019-01-31 00:48:31,825 : INFO : topic diff=0.004405, rho=0.032513\n", + "2019-01-31 00:48:31,978 : INFO : PROGRESS: pass 0, at document #1894000/4922894\n", + "2019-01-31 00:48:33,340 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:33,606 : INFO : topic #31 (0.020): 0.056*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.025*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:48:33,608 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.022*\"dutch\" + 0.019*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"netherland\"\n", + "2019-01-31 00:48:33,609 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.043*\"vigour\" + 0.043*\"popolo\" + 0.040*\"tortur\" + 0.032*\"cotton\" + 0.029*\"area\" + 0.024*\"multitud\" + 0.023*\"regim\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:48:33,610 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.032*\"rural\" + 0.031*\"personifi\" + 0.027*\"poison\" + 0.026*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:48:33,611 : INFO : topic #24 (0.020): 
0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:48:33,617 : INFO : topic diff=0.004884, rho=0.032496\n", + "2019-01-31 00:48:33,770 : INFO : PROGRESS: pass 0, at document #1896000/4922894\n", + "2019-01-31 00:48:35,143 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:35,409 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.029*\"germani\" + 0.016*\"vol\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.010*\"european\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:48:35,410 : INFO : topic #31 (0.020): 0.057*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.025*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:48:35,411 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.021*\"member\" + 0.017*\"serv\" + 0.017*\"gener\" + 0.016*\"start\" + 0.016*\"seri\"\n", + "2019-01-31 00:48:35,413 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"noll\" + 0.022*\"japanes\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 00:48:35,413 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.044*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.014*\"sourc\" + 0.013*\"kim\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:48:35,419 : INFO : topic diff=0.005429, rho=0.032478\n", + "2019-01-31 00:48:35,577 : INFO : PROGRESS: pass 0, at document #1898000/4922894\n", + "2019-01-31 00:48:36,960 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:37,226 : INFO : topic #10 (0.020): 
0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"pathwai\" + 0.006*\"effect\" + 0.006*\"human\"\n", + "2019-01-31 00:48:37,227 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:48:37,228 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.007*\"veget\" + 0.007*\"encyclopedia\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.007*\"produc\"\n", + "2019-01-31 00:48:37,230 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.007*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 00:48:37,231 : INFO : topic #29 (0.020): 0.027*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:48:37,236 : INFO : topic diff=0.004155, rho=0.032461\n", + "2019-01-31 00:48:39,962 : INFO : -11.640 per-word bound, 3191.1 perplexity estimate based on a held-out corpus of 2000 documents with 590783 words\n", + "2019-01-31 00:48:39,962 : INFO : PROGRESS: pass 0, at document #1900000/4922894\n", + "2019-01-31 00:48:41,355 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:41,621 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.028*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"start\" + 0.009*\"task\"\n", + "2019-01-31 00:48:41,622 : INFO : topic #33 (0.020): 
0.061*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"loui\" + 0.012*\"lazi\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:48:41,623 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"help\"\n", + "2019-01-31 00:48:41,625 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.026*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:48:41,626 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:48:41,632 : INFO : topic diff=0.005479, rho=0.032444\n", + "2019-01-31 00:48:41,786 : INFO : PROGRESS: pass 0, at document #1902000/4922894\n", + "2019-01-31 00:48:43,163 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:43,429 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.032*\"cotton\" + 0.029*\"area\" + 0.024*\"multitud\" + 0.023*\"regim\" + 0.021*\"citi\" + 0.020*\"commun\"\n", + "2019-01-31 00:48:43,430 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:48:43,431 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.017*\"black\" + 0.016*\"western\" + 0.014*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:48:43,432 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 
0.029*\"american\" + 0.029*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:48:43,433 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.007*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:48:43,439 : INFO : topic diff=0.004403, rho=0.032427\n", + "2019-01-31 00:48:43,593 : INFO : PROGRESS: pass 0, at document #1904000/4922894\n", + "2019-01-31 00:48:44,988 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:45,254 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.018*\"wind\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.015*\"norwegian\" + 0.013*\"damag\" + 0.013*\"denmark\" + 0.012*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:48:45,255 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 00:48:45,256 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.038*\"struggl\" + 0.036*\"high\" + 0.028*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"start\" + 0.009*\"gothic\"\n", + "2019-01-31 00:48:45,257 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:48:45,258 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\" + 0.010*\"lizard\"\n", + "2019-01-31 00:48:45,264 : INFO : topic diff=0.004702, rho=0.032410\n", + "2019-01-31 00:48:45,421 : INFO : 
PROGRESS: pass 0, at document #1906000/4922894\n", + "2019-01-31 00:48:46,814 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:47,080 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.007*\"user\" + 0.007*\"window\" + 0.007*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 00:48:47,081 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.033*\"incumb\" + 0.014*\"televis\" + 0.013*\"anglo\" + 0.011*\"pakistan\" + 0.011*\"islam\" + 0.011*\"khalsa\" + 0.010*\"sri\" + 0.009*\"tajikistan\" + 0.009*\"muskoge\"\n", + "2019-01-31 00:48:47,082 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:48:47,084 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.007*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:48:47,085 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:48:47,090 : INFO : topic diff=0.005282, rho=0.032393\n", + "2019-01-31 00:48:47,244 : INFO : PROGRESS: pass 0, at document #1908000/4922894\n", + "2019-01-31 00:48:48,625 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:48,891 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"acid\"\n", + "2019-01-31 00:48:48,892 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 
0.024*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.014*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:48:48,893 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:48:48,894 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.038*\"struggl\" + 0.036*\"high\" + 0.028*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 00:48:48,895 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:48:48,901 : INFO : topic diff=0.005380, rho=0.032376\n", + "2019-01-31 00:48:49,054 : INFO : PROGRESS: pass 0, at document #1910000/4922894\n", + "2019-01-31 00:48:50,428 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:50,695 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:48:50,696 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.020*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.014*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:48:50,697 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.024*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:48:50,698 : INFO : topic #49 (0.020): 0.045*\"india\" 
+ 0.033*\"incumb\" + 0.014*\"televis\" + 0.013*\"anglo\" + 0.011*\"pakistan\" + 0.011*\"islam\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"singh\"\n", + "2019-01-31 00:48:50,699 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:48:50,705 : INFO : topic diff=0.005164, rho=0.032359\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:48:50,862 : INFO : PROGRESS: pass 0, at document #1912000/4922894\n", + "2019-01-31 00:48:52,281 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:52,547 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:48:52,548 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:48:52,549 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.014*\"militari\" + 0.012*\"airmen\" + 0.011*\"airbu\"\n", + "2019-01-31 00:48:52,550 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.013*\"taxpay\" + 0.013*\"winner\"\n", + "2019-01-31 00:48:52,551 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.014*\"sourc\" + 0.012*\"ashvil\" + 0.012*\"kim\"\n", + "2019-01-31 
00:48:52,557 : INFO : topic diff=0.005078, rho=0.032342\n", + "2019-01-31 00:48:52,711 : INFO : PROGRESS: pass 0, at document #1914000/4922894\n", + "2019-01-31 00:48:54,077 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:54,344 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:48:54,345 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"strategist\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:48:54,346 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.013*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 00:48:54,347 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.013*\"taxpay\" + 0.013*\"winner\"\n", + "2019-01-31 00:48:54,348 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 0.029*\"american\" + 0.029*\"new\" + 0.027*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:48:54,354 : INFO : topic diff=0.004101, rho=0.032325\n", + "2019-01-31 00:48:54,510 : INFO : PROGRESS: pass 0, at document #1916000/4922894\n", + "2019-01-31 00:48:55,910 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:56,176 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"vigour\" + 0.043*\"popolo\" + 0.039*\"tortur\" + 0.032*\"cotton\" + 0.029*\"area\" + 0.025*\"multitud\" + 0.023*\"regim\" + 0.022*\"citi\" + 
0.019*\"cede\"\n", + "2019-01-31 00:48:56,177 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:48:56,178 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:48:56,179 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.029*\"new\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:48:56,180 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.030*\"workplac\" + 0.027*\"champion\" + 0.027*\"men\" + 0.026*\"olymp\" + 0.023*\"medal\" + 0.021*\"event\" + 0.020*\"taxpay\" + 0.019*\"atheist\" + 0.019*\"rainfal\"\n", + "2019-01-31 00:48:56,186 : INFO : topic diff=0.005098, rho=0.032309\n", + "2019-01-31 00:48:56,400 : INFO : PROGRESS: pass 0, at document #1918000/4922894\n", + "2019-01-31 00:48:57,779 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:48:58,045 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.030*\"american\" + 0.029*\"new\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:48:58,046 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.019*\"wind\" + 0.017*\"norwai\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.013*\"huntsvil\" + 0.013*\"denmark\" + 0.013*\"damag\" + 0.011*\"farid\"\n", + "2019-01-31 00:48:58,047 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" 
+ 0.011*\"francisco\" + 0.010*\"lizard\"\n", + "2019-01-31 00:48:58,048 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:48:58,049 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.020*\"taxpay\" + 0.015*\"ret\" + 0.013*\"driver\" + 0.011*\"find\" + 0.010*\"fool\" + 0.010*\"tornado\" + 0.010*\"champion\" + 0.010*\"théori\"\n", + "2019-01-31 00:48:58,055 : INFO : topic diff=0.005077, rho=0.032292\n", + "2019-01-31 00:49:00,704 : INFO : -11.487 per-word bound, 2869.5 perplexity estimate based on a held-out corpus of 2000 documents with 550615 words\n", + "2019-01-31 00:49:00,704 : INFO : PROGRESS: pass 0, at document #1920000/4922894\n", + "2019-01-31 00:49:02,079 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:02,345 : INFO : topic #43 (0.020): 0.068*\"elect\" + 0.055*\"parti\" + 0.023*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:49:02,346 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.042*\"line\" + 0.034*\"arsen\" + 0.034*\"raid\" + 0.025*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.016*\"pain\" + 0.013*\"exhaust\" + 0.013*\"oper\"\n", + "2019-01-31 00:49:02,347 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.020*\"taxpay\" + 0.015*\"ret\" + 0.013*\"driver\" + 0.012*\"find\" + 0.010*\"tornado\" + 0.010*\"fool\" + 0.010*\"champion\" + 0.010*\"théori\"\n", + "2019-01-31 00:49:02,348 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.028*\"personifi\" + 0.027*\"poison\" + 0.025*\"reprint\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 00:49:02,350 : INFO : 
topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.008*\"cathedr\"\n", + "2019-01-31 00:49:02,355 : INFO : topic diff=0.005703, rho=0.032275\n", + "2019-01-31 00:49:02,509 : INFO : PROGRESS: pass 0, at document #1922000/4922894\n", + "2019-01-31 00:49:03,872 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:04,140 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.014*\"militari\" + 0.012*\"airmen\" + 0.012*\"airbu\"\n", + "2019-01-31 00:49:04,141 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.021*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.016*\"player\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.010*\"simpler\"\n", + "2019-01-31 00:49:04,142 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"candid\" + 0.006*\"produc\"\n", + "2019-01-31 00:49:04,144 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:49:04,145 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:49:04,151 : INFO : topic diff=0.005001, rho=0.032258\n", + "2019-01-31 00:49:04,304 : INFO : PROGRESS: pass 0, at document #1924000/4922894\n", + "2019-01-31 00:49:05,687 : 
INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:05,954 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:49:05,955 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"anglo\" + 0.013*\"televis\" + 0.012*\"islam\" + 0.011*\"pakistan\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"start\"\n", + "2019-01-31 00:49:05,956 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:49:05,957 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:49:05,958 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"user\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 00:49:05,964 : INFO : topic diff=0.004528, rho=0.032241\n", + "2019-01-31 00:49:06,125 : INFO : PROGRESS: pass 0, at document #1926000/4922894\n", + "2019-01-31 00:49:07,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:07,808 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.024*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.009*\"biom\"\n", + "2019-01-31 00:49:07,810 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 
0.007*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:49:07,811 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.034*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.014*\"maria\" + 0.013*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:49:07,812 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"woman\" + 0.028*\"champion\" + 0.027*\"olymp\" + 0.026*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.019*\"taxpay\" + 0.019*\"atheist\" + 0.019*\"alic\"\n", + "2019-01-31 00:49:07,813 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:49:07,819 : INFO : topic diff=0.004828, rho=0.032225\n", + "2019-01-31 00:49:07,976 : INFO : PROGRESS: pass 0, at document #1928000/4922894\n", + "2019-01-31 00:49:09,367 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:09,633 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.011*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:49:09,635 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:49:09,636 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"anglo\" + 0.013*\"televis\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"start\"\n", + "2019-01-31 00:49:09,637 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.042*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.019*\"folei\" + 0.018*\"polit\" + 0.016*\"player\" + 
0.016*\"english\" + 0.012*\"acrimoni\" + 0.010*\"netherland\"\n", + "2019-01-31 00:49:09,638 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.033*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.013*\"maria\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + "2019-01-31 00:49:09,643 : INFO : topic diff=0.005096, rho=0.032208\n", + "2019-01-31 00:49:09,801 : INFO : PROGRESS: pass 0, at document #1930000/4922894\n", + "2019-01-31 00:49:11,188 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:11,454 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:49:11,455 : INFO : topic #46 (0.020): 0.020*\"stop\" + 0.018*\"wind\" + 0.017*\"norwai\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.013*\"denmark\" + 0.012*\"damag\" + 0.012*\"huntsvil\" + 0.011*\"danish\"\n", + "2019-01-31 00:49:11,456 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:49:11,457 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"personifi\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.017*\"turin\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:49:11,458 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"anglo\" + 0.013*\"televis\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.009*\"sri\" + 0.009*\"alam\"\n", + "2019-01-31 00:49:11,465 : INFO : topic diff=0.004761, rho=0.032191\n", + "2019-01-31 00:49:11,618 : INFO : PROGRESS: pass 0, at document #1932000/4922894\n", + 
"2019-01-31 00:49:13,007 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:13,274 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.015*\"tiepolo\" + 0.015*\"chamber\" + 0.014*\"open\" + 0.014*\"taxpay\" + 0.013*\"martin\"\n", + "2019-01-31 00:49:13,276 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.026*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:49:13,277 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 00:49:13,278 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.012*\"berlin\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:49:13,279 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:49:13,284 : INFO : topic diff=0.004585, rho=0.032174\n", + "2019-01-31 00:49:13,441 : INFO : PROGRESS: pass 0, at document #1934000/4922894\n", + "2019-01-31 00:49:14,825 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:15,095 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"charact\" + 0.008*\"love\" + 0.008*\"septemb\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"blue\" + 0.005*\"dixi\"\n", + "2019-01-31 00:49:15,096 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.039*\"sovereignti\" + 0.034*\"rural\" + 0.027*\"poison\" + 
0.026*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.016*\"turin\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:49:15,097 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:49:15,098 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 00:49:15,099 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 00:49:15,105 : INFO : topic diff=0.004978, rho=0.032158\n", + "2019-01-31 00:49:15,262 : INFO : PROGRESS: pass 0, at document #1936000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:49:16,655 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:16,921 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:49:16,922 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.049*\"franc\" + 0.029*\"pari\" + 0.025*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:49:16,923 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:49:16,924 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 
0.028*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"player\" + 0.015*\"english\" + 0.011*\"acrimoni\" + 0.010*\"netherland\"\n", + "2019-01-31 00:49:16,925 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 00:49:16,931 : INFO : topic diff=0.005146, rho=0.032141\n", + "2019-01-31 00:49:17,089 : INFO : PROGRESS: pass 0, at document #1938000/4922894\n", + "2019-01-31 00:49:18,503 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:18,770 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:49:18,771 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.012*\"berlin\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:49:18,772 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:49:18,773 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 00:49:18,774 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.014*\"taxpay\" + 0.013*\"open\" + 0.013*\"martin\"\n", + "2019-01-31 00:49:18,780 : INFO : topic diff=0.004266, rho=0.032125\n", + "2019-01-31 
00:49:21,493 : INFO : -11.841 per-word bound, 3667.3 perplexity estimate based on a held-out corpus of 2000 documents with 583447 words\n", + "2019-01-31 00:49:21,494 : INFO : PROGRESS: pass 0, at document #1940000/4922894\n", + "2019-01-31 00:49:22,896 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:23,163 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:49:23,164 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.010*\"champion\" + 0.010*\"fool\" + 0.009*\"squatter\"\n", + "2019-01-31 00:49:23,165 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:49:23,166 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 00:49:23,167 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.026*\"new\" + 0.024*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:49:23,173 : INFO : topic diff=0.005050, rho=0.032108\n", + "2019-01-31 00:49:23,328 : INFO : PROGRESS: pass 0, at document #1942000/4922894\n", + "2019-01-31 00:49:24,705 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:24,971 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.013*\"edit\" + 
0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:49:24,972 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.027*\"australia\" + 0.026*\"new\" + 0.024*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:49:24,973 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.042*\"canadian\" + 0.024*\"toronto\" + 0.024*\"ontario\" + 0.020*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.013*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:49:24,974 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 00:49:24,975 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:49:24,981 : INFO : topic diff=0.006021, rho=0.032092\n", + "2019-01-31 00:49:25,134 : INFO : PROGRESS: pass 0, at document #1944000/4922894\n", + "2019-01-31 00:49:26,508 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:26,774 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 00:49:26,775 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.024*\"korea\" + 0.022*\"hong\" + 0.021*\"kong\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.014*\"leah\" + 0.013*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 00:49:26,776 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"black\" + 0.017*\"colder\" + 
0.016*\"western\" + 0.013*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:49:26,778 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"epiru\" + 0.024*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:49:26,779 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"noll\" + 0.021*\"japanes\" + 0.018*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:49:26,784 : INFO : topic diff=0.004810, rho=0.032075\n", + "2019-01-31 00:49:26,935 : INFO : PROGRESS: pass 0, at document #1946000/4922894\n", + "2019-01-31 00:49:28,281 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:28,547 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.023*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"hostil\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.009*\"live\"\n", + "2019-01-31 00:49:28,548 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.017*\"ret\" + 0.013*\"driver\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"champion\" + 0.010*\"fool\" + 0.009*\"théori\"\n", + "2019-01-31 00:49:28,549 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.025*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:49:28,550 : INFO : topic #34 (0.020): 0.072*\"start\" + 0.032*\"unionist\" + 0.030*\"new\" + 0.029*\"american\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:49:28,551 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.050*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 
0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:49:28,557 : INFO : topic diff=0.005310, rho=0.032059\n", + "2019-01-31 00:49:28,716 : INFO : PROGRESS: pass 0, at document #1948000/4922894\n", + "2019-01-31 00:49:30,262 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:49:30,529 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 00:49:30,530 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"year\"\n", + "2019-01-31 00:49:30,531 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"utopian\" + 0.006*\"method\"\n", + "2019-01-31 00:49:30,532 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 00:49:30,534 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"liber\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.016*\"conserv\" + 0.013*\"bypass\"\n", + "2019-01-31 00:49:30,540 : INFO : topic diff=0.005105, rho=0.032042\n", + "2019-01-31 00:49:30,695 : INFO : PROGRESS: pass 0, at document #1950000/4922894\n", + "2019-01-31 00:49:32,065 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:32,332 : INFO : topic #48 (0.020): 0.082*\"march\" + 
0.078*\"octob\" + 0.078*\"sens\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.071*\"notion\" + 0.069*\"judici\" + 0.069*\"april\" + 0.068*\"august\" + 0.066*\"decatur\"\n", + "2019-01-31 00:49:32,333 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"cytokin\" + 0.009*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 00:49:32,334 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.008*\"love\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"dixi\" + 0.005*\"blue\"\n", + "2019-01-31 00:49:32,335 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.033*\"priest\" + 0.022*\"duke\" + 0.020*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"idiosyncrat\" + 0.014*\"maria\" + 0.013*\"count\" + 0.013*\"kingdom\"\n", + "2019-01-31 00:49:32,337 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:49:32,342 : INFO : topic diff=0.005118, rho=0.032026\n", + "2019-01-31 00:49:32,564 : INFO : PROGRESS: pass 0, at document #1952000/4922894\n", + "2019-01-31 00:49:34,000 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:34,267 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:49:34,268 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.041*\"canadian\" + 0.024*\"toronto\" + 0.023*\"ontario\" + 0.021*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:49:34,269 : INFO : topic #27 (0.020): 
0.068*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.011*\"find\" + 0.011*\"tornado\" + 0.011*\"champion\" + 0.010*\"fool\" + 0.009*\"théori\"\n", + "2019-01-31 00:49:34,270 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.005*\"mode\" + 0.005*\"measur\"\n", + "2019-01-31 00:49:34,272 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.013*\"airmen\" + 0.012*\"airbu\"\n", + "2019-01-31 00:49:34,278 : INFO : topic diff=0.005351, rho=0.032009\n", + "2019-01-31 00:49:34,429 : INFO : PROGRESS: pass 0, at document #1954000/4922894\n", + "2019-01-31 00:49:35,765 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:36,031 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"taxpay\" + 0.013*\"open\" + 0.013*\"martin\"\n", + "2019-01-31 00:49:36,032 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.056*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"liber\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.015*\"conserv\" + 0.013*\"bypass\"\n", + "2019-01-31 00:49:36,034 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:49:36,035 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.019*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"unionist\"\n", + "2019-01-31 00:49:36,036 : INFO : topic #47 (0.020): 
0.065*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:49:36,042 : INFO : topic diff=0.005795, rho=0.031993\n", + "2019-01-31 00:49:36,198 : INFO : PROGRESS: pass 0, at document #1956000/4922894\n", + "2019-01-31 00:49:37,586 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:37,853 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.008*\"love\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"blue\" + 0.005*\"vision\"\n", + "2019-01-31 00:49:37,854 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"black\" + 0.016*\"colder\" + 0.016*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:49:37,855 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.024*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:49:37,856 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.025*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"open\" + 0.013*\"martin\"\n", + "2019-01-31 00:49:37,857 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:49:37,863 : INFO : topic diff=0.004210, rho=0.031976\n", + "2019-01-31 00:49:38,016 : INFO : PROGRESS: pass 0, at document #1958000/4922894\n", + "2019-01-31 00:49:39,383 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:49:39,650 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.049*\"franc\" + 0.031*\"pari\" + 0.025*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:49:39,651 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.007*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:49:39,652 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.041*\"canadian\" + 0.024*\"toronto\" + 0.023*\"ontario\" + 0.021*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:49:39,653 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.056*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.019*\"liber\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.015*\"conserv\" + 0.014*\"bypass\"\n", + "2019-01-31 00:49:39,654 : INFO : topic #4 (0.020): 0.023*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"candid\"\n", + "2019-01-31 00:49:39,660 : INFO : topic diff=0.004268, rho=0.031960\n", + "2019-01-31 00:49:42,355 : INFO : -11.600 per-word bound, 3103.8 perplexity estimate based on a held-out corpus of 2000 documents with 554316 words\n", + "2019-01-31 00:49:42,356 : INFO : PROGRESS: pass 0, at document #1960000/4922894\n", + "2019-01-31 00:49:43,749 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:49:44,016 : INFO : topic #46 (0.020): 0.020*\"sweden\" + 0.018*\"stop\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"wind\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.013*\"denmark\" + 0.011*\"danish\" + 0.011*\"turkish\"\n", + "2019-01-31 00:49:44,017 : INFO : 
topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"start\"\n", + "2019-01-31 00:49:44,018 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.015*\"soviet\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"josé\" + 0.011*\"francisco\"\n", + "2019-01-31 00:49:44,019 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.007*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:49:44,020 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.039*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:49:44,026 : INFO : topic diff=0.004810, rho=0.031944\n", + "2019-01-31 00:49:44,180 : INFO : PROGRESS: pass 0, at document #1962000/4922894\n", + "2019-01-31 00:49:45,551 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:45,817 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"anglo\" + 0.013*\"televis\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"singh\"\n", + "2019-01-31 00:49:45,818 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"princess\"\n", + "2019-01-31 00:49:45,819 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.015*\"english\" + 0.011*\"acrimoni\" + 0.011*\"netherland\"\n", + "2019-01-31 00:49:45,820 : INFO : topic 
#30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:49:45,821 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.008*\"love\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"blue\" + 0.005*\"vision\"\n", + "2019-01-31 00:49:45,827 : INFO : topic diff=0.004444, rho=0.031928\n", + "2019-01-31 00:49:45,978 : INFO : PROGRESS: pass 0, at document #1964000/4922894\n", + "2019-01-31 00:49:47,331 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:47,598 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"anglo\" + 0.012*\"televis\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"alam\"\n", + "2019-01-31 00:49:47,599 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"acid\"\n", + "2019-01-31 00:49:47,600 : INFO : topic #46 (0.020): 0.020*\"sweden\" + 0.018*\"stop\" + 0.017*\"wind\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.014*\"damag\" + 0.013*\"denmark\" + 0.012*\"turkish\" + 0.011*\"farid\"\n", + "2019-01-31 00:49:47,601 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"seri\"\n", + "2019-01-31 00:49:47,602 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.041*\"canadian\" + 0.024*\"toronto\" + 0.023*\"ontario\" + 0.020*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:49:47,608 : INFO : topic diff=0.005240, 
rho=0.031911\n", + "2019-01-31 00:49:47,767 : INFO : PROGRESS: pass 0, at document #1966000/4922894\n", + "2019-01-31 00:49:49,263 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:49,530 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.024*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"genu\" + 0.011*\"plaisir\" + 0.010*\"hostil\" + 0.009*\"live\" + 0.008*\"biom\"\n", + "2019-01-31 00:49:49,531 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.016*\"mount\" + 0.009*\"palmer\" + 0.008*\"land\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"lobe\"\n", + "2019-01-31 00:49:49,532 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.024*\"medal\" + 0.021*\"event\" + 0.020*\"alic\" + 0.019*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:49:49,533 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.044*\"chilton\" + 0.024*\"hong\" + 0.023*\"korea\" + 0.023*\"kong\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:49:49,534 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.042*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.016*\"player\" + 0.015*\"english\" + 0.011*\"acrimoni\" + 0.010*\"netherland\"\n", + "2019-01-31 00:49:49,539 : INFO : topic diff=0.005688, rho=0.031895\n", + "2019-01-31 00:49:49,694 : INFO : PROGRESS: pass 0, at document #1968000/4922894\n", + "2019-01-31 00:49:51,077 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:51,343 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.041*\"canadian\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.020*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:49:51,344 : INFO : topic #31 (0.020): 
0.054*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.025*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:49:51,346 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:49:51,347 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airmen\" + 0.011*\"airbu\"\n", + "2019-01-31 00:49:51,348 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.044*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:49:51,353 : INFO : topic diff=0.005224, rho=0.031879\n", + "2019-01-31 00:49:51,508 : INFO : PROGRESS: pass 0, at document #1970000/4922894\n", + "2019-01-31 00:49:52,884 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:53,150 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:49:53,151 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.008*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:49:53,152 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.025*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:49:53,154 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 
0.011*\"prognosi\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"base\"\n", + "2019-01-31 00:49:53,154 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.038*\"tortur\" + 0.033*\"cotton\" + 0.028*\"area\" + 0.024*\"multitud\" + 0.022*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:49:53,160 : INFO : topic diff=0.004855, rho=0.031863\n", + "2019-01-31 00:49:53,313 : INFO : PROGRESS: pass 0, at document #1972000/4922894\n", + "2019-01-31 00:49:54,682 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:54,948 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:49:54,949 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.015*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:49:54,950 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"yawn\"\n", + "2019-01-31 00:49:54,952 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.018*\"damag\" + 0.018*\"stop\" + 0.017*\"swedish\" + 0.016*\"wind\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.013*\"denmark\" + 0.011*\"turkish\" + 0.011*\"danish\"\n", + "2019-01-31 00:49:54,952 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.072*\"januari\" + 0.071*\"notion\" + 0.069*\"juli\" + 0.069*\"april\" + 0.068*\"judici\" + 0.067*\"august\" + 0.066*\"decatur\"\n", + "2019-01-31 00:49:54,958 : INFO : topic 
diff=0.004669, rho=0.031846\n", + "2019-01-31 00:49:55,117 : INFO : PROGRESS: pass 0, at document #1974000/4922894\n", + "2019-01-31 00:49:56,526 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:56,792 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:49:56,793 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:49:56,795 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.015*\"soviet\" + 0.012*\"juan\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"francisco\" + 0.011*\"josé\"\n", + "2019-01-31 00:49:56,796 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"class\" + 0.010*\"bahá\"\n", + "2019-01-31 00:49:56,797 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.009*\"landslid\"\n", + "2019-01-31 00:49:56,803 : INFO : topic diff=0.004973, rho=0.031830\n", + "2019-01-31 00:49:56,954 : INFO : PROGRESS: pass 0, at document #1976000/4922894\n", + "2019-01-31 00:49:58,316 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:49:58,583 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.041*\"canadian\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.020*\"hoar\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.013*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"vancouv\"\n", + 
"2019-01-31 00:49:58,584 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.065*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"japanes\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.015*\"misconcept\"\n", + "2019-01-31 00:49:58,585 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.018*\"liber\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.014*\"conserv\"\n", + "2019-01-31 00:49:58,586 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.039*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 00:49:58,587 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"brio\"\n", + "2019-01-31 00:49:58,593 : INFO : topic diff=0.004903, rho=0.031814\n", + "2019-01-31 00:49:58,753 : INFO : PROGRESS: pass 0, at document #1978000/4922894\n", + "2019-01-31 00:50:00,170 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:00,437 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.029*\"new\" + 0.029*\"american\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.016*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:50:00,438 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.011*\"deal\"\n", + "2019-01-31 00:50:00,439 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", 
+ "2019-01-31 00:50:00,440 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.025*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:50:00,442 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"land\" + 0.008*\"foam\" + 0.008*\"north\" + 0.008*\"lobe\"\n", + "2019-01-31 00:50:00,447 : INFO : topic diff=0.004569, rho=0.031798\n", + "2019-01-31 00:50:03,141 : INFO : -11.702 per-word bound, 3330.5 perplexity estimate based on a held-out corpus of 2000 documents with 579388 words\n", + "2019-01-31 00:50:03,142 : INFO : PROGRESS: pass 0, at document #1980000/4922894\n", + "2019-01-31 00:50:04,519 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:04,787 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.038*\"tortur\" + 0.032*\"cotton\" + 0.028*\"area\" + 0.024*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:50:04,788 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.014*\"leah\" + 0.014*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:50:04,788 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.017*\"folei\" + 0.016*\"player\" + 0.015*\"english\" + 0.010*\"acrimoni\" + 0.010*\"surnam\"\n", + "2019-01-31 00:50:04,789 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.029*\"new\" + 0.029*\"american\" + 0.026*\"cotton\" + 0.017*\"year\" + 0.016*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:50:04,790 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"woman\" + 0.028*\"champion\" + 
0.025*\"men\" + 0.025*\"olymp\" + 0.024*\"medal\" + 0.021*\"event\" + 0.019*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"alic\"\n", + "2019-01-31 00:50:04,797 : INFO : topic diff=0.004592, rho=0.031782\n", + "2019-01-31 00:50:05,007 : INFO : PROGRESS: pass 0, at document #1982000/4922894\n", + "2019-01-31 00:50:06,583 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:06,850 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"acid\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:50:06,851 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.024*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:50:06,852 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"black\" + 0.016*\"western\" + 0.016*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"arm\" + 0.008*\"depress\"\n", + "2019-01-31 00:50:06,854 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:50:06,855 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.012*\"fool\" + 0.010*\"champion\" + 0.009*\"squatter\"\n", + "2019-01-31 00:50:06,861 : INFO : topic diff=0.004786, rho=0.031766\n", + "2019-01-31 00:50:07,017 : INFO : PROGRESS: pass 0, at document #1984000/4922894\n", + "2019-01-31 00:50:08,393 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:08,659 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.045*\"vigour\" + 
0.044*\"popolo\" + 0.038*\"tortur\" + 0.032*\"cotton\" + 0.027*\"area\" + 0.024*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:50:08,660 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.069*\"juli\" + 0.069*\"april\" + 0.067*\"august\" + 0.066*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 00:50:08,661 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:50:08,662 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:08,663 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.018*\"polit\" + 0.018*\"folei\" + 0.016*\"player\" + 0.015*\"english\" + 0.011*\"acrimoni\" + 0.010*\"simpler\"\n", + "2019-01-31 00:50:08,669 : INFO : topic diff=0.005008, rho=0.031750\n", + "2019-01-31 00:50:08,822 : INFO : PROGRESS: pass 0, at document #1986000/4922894\n", + "2019-01-31 00:50:10,180 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:10,446 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:50:10,447 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:50:10,448 
: INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:50:10,449 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:50:10,450 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"vigour\" + 0.044*\"popolo\" + 0.038*\"tortur\" + 0.032*\"cotton\" + 0.027*\"area\" + 0.024*\"multitud\" + 0.022*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:50:10,456 : INFO : topic diff=0.004318, rho=0.031734\n", + "2019-01-31 00:50:10,615 : INFO : PROGRESS: pass 0, at document #1988000/4922894\n", + "2019-01-31 00:50:12,029 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:12,296 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"militari\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"airmen\" + 0.011*\"airbu\"\n", + "2019-01-31 00:50:12,297 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.041*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"personifi\" + 0.025*\"poison\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 00:50:12,297 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:50:12,298 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.019*\"polit\" + 0.019*\"dutch\" + 0.017*\"folei\" + 0.017*\"player\" + 0.015*\"english\" + 0.011*\"acrimoni\" + 0.010*\"simpler\"\n", + "2019-01-31 00:50:12,299 : INFO : topic #36 
(0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 00:50:12,305 : INFO : topic diff=0.004584, rho=0.031718\n", + "2019-01-31 00:50:12,464 : INFO : PROGRESS: pass 0, at document #1990000/4922894\n", + "2019-01-31 00:50:13,854 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:14,121 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.016*\"mount\" + 0.009*\"palmer\" + 0.009*\"land\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 00:50:14,122 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:14,123 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.025*\"minist\" + 0.022*\"govern\" + 0.021*\"nation\" + 0.021*\"member\" + 0.017*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.016*\"seri\"\n", + "2019-01-31 00:50:14,124 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.041*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 00:50:14,125 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\" + 0.009*\"yawn\"\n", + "2019-01-31 00:50:14,131 : INFO : topic diff=0.004435, rho=0.031702\n", + "2019-01-31 00:50:14,295 : INFO : PROGRESS: pass 0, at document #1992000/4922894\n", + "2019-01-31 00:50:15,836 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:16,103 : INFO : 
topic #16 (0.020): 0.054*\"king\" + 0.032*\"priest\" + 0.022*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.013*\"count\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 00:50:16,105 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:16,106 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 00:50:16,107 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.040*\"canadian\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.020*\"hoar\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.014*\"hydrogen\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:50:16,108 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.013*\"televis\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.009*\"singh\"\n", + "2019-01-31 00:50:16,114 : INFO : topic diff=0.006156, rho=0.031686\n", + "2019-01-31 00:50:16,268 : INFO : PROGRESS: pass 0, at document #1994000/4922894\n", + "2019-01-31 00:50:17,626 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:17,892 : INFO : topic #7 (0.020): 0.021*\"di\" + 0.020*\"snatch\" + 0.019*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.011*\"will\" + 0.011*\"daughter\"\n", + "2019-01-31 00:50:17,893 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"fool\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.010*\"horac\" + 0.010*\"champion\"\n", + "2019-01-31 00:50:17,894 : INFO : 
topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\" + 0.009*\"yawn\"\n", + "2019-01-31 00:50:17,895 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"anglo\" + 0.013*\"televis\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.009*\"singh\"\n", + "2019-01-31 00:50:17,896 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"warmth\" + 0.016*\"lagrang\" + 0.016*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"land\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 00:50:17,902 : INFO : topic diff=0.004276, rho=0.031670\n", + "2019-01-31 00:50:18,056 : INFO : PROGRESS: pass 0, at document #1996000/4922894\n", + "2019-01-31 00:50:19,416 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:19,683 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.015*\"anglo\" + 0.013*\"televis\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.009*\"singh\"\n", + "2019-01-31 00:50:19,684 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\" + 0.009*\"yawn\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:50:19,685 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.042*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:50:19,686 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.079*\"march\" + 0.077*\"octob\" + 0.069*\"januari\" + 0.069*\"juli\" + 0.069*\"april\" + 0.069*\"notion\" + 0.067*\"august\" + 0.067*\"judici\" + 
0.064*\"decatur\"\n", + "2019-01-31 00:50:19,686 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.028*\"champion\" + 0.026*\"men\" + 0.026*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.019*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:50:19,692 : INFO : topic diff=0.006056, rho=0.031654\n", + "2019-01-31 00:50:19,856 : INFO : PROGRESS: pass 0, at document #1998000/4922894\n", + "2019-01-31 00:50:21,302 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:21,568 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"acid\" + 0.005*\"effect\"\n", + "2019-01-31 00:50:21,569 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.043*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:50:21,570 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.021*\"member\" + 0.017*\"gener\" + 0.016*\"start\" + 0.016*\"serv\" + 0.016*\"seri\"\n", + "2019-01-31 00:50:21,571 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 00:50:21,573 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:50:21,578 : INFO : topic diff=0.006084, rho=0.031639\n", + "2019-01-31 00:50:24,256 : INFO : -11.843 per-word bound, 3674.2 perplexity estimate based on a held-out corpus of 2000 documents with 538045 words\n", + "2019-01-31 
00:50:24,256 : INFO : PROGRESS: pass 0, at document #2000000/4922894\n", + "2019-01-31 00:50:25,637 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:25,903 : INFO : topic #27 (0.020): 0.067*\"questionnair\" + 0.019*\"taxpay\" + 0.019*\"candid\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.010*\"horac\" + 0.010*\"champion\"\n", + "2019-01-31 00:50:25,904 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.027*\"australia\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:50:25,905 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:25,906 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:50:25,907 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.008*\"love\" + 0.007*\"gestur\" + 0.007*\"comic\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"blue\" + 0.005*\"workplac\"\n", + "2019-01-31 00:50:25,913 : INFO : topic diff=0.004384, rho=0.031623\n", + "2019-01-31 00:50:26,072 : INFO : PROGRESS: pass 0, at document #2002000/4922894\n", + "2019-01-31 00:50:27,472 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:27,738 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:50:27,739 : INFO : topic #47 (0.020): 
0.066*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:50:27,740 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:50:27,741 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:50:27,742 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:50:27,748 : INFO : topic diff=0.005064, rho=0.031607\n", + "2019-01-31 00:50:27,903 : INFO : PROGRESS: pass 0, at document #2004000/4922894\n", + "2019-01-31 00:50:29,300 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:29,566 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.041*\"canadian\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.020*\"hoar\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:50:29,567 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"replac\" + 0.008*\"princess\"\n", + "2019-01-31 00:50:29,568 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:29,569 : INFO : topic #1 (0.020): 
0.052*\"china\" + 0.047*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:50:29,570 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 00:50:29,576 : INFO : topic diff=0.004193, rho=0.031591\n", + "2019-01-31 00:50:29,737 : INFO : PROGRESS: pass 0, at document #2006000/4922894\n", + "2019-01-31 00:50:31,113 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:31,379 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.013*\"oper\"\n", + "2019-01-31 00:50:31,380 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.019*\"taxpay\" + 0.019*\"alic\" + 0.018*\"atheist\"\n", + "2019-01-31 00:50:31,381 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"acid\" + 0.005*\"effect\"\n", + "2019-01-31 00:50:31,382 : INFO : topic #20 (0.020): 0.147*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:50:31,383 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:50:31,389 : INFO : topic diff=0.004469, rho=0.031575\n", + "2019-01-31 00:50:31,543 : 
INFO : PROGRESS: pass 0, at document #2008000/4922894\n", + "2019-01-31 00:50:32,913 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:33,179 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"hot\" + 0.009*\"dai\"\n", + "2019-01-31 00:50:33,180 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:50:33,181 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:50:33,182 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.025*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:50:33,183 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"horac\"\n", + "2019-01-31 00:50:33,189 : INFO : topic diff=0.004875, rho=0.031560\n", + "2019-01-31 00:50:33,348 : INFO : PROGRESS: pass 0, at document #2010000/4922894\n", + "2019-01-31 00:50:34,751 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:35,018 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.008*\"love\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:50:35,019 : 
INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"taxpay\" + 0.019*\"candid\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"horac\"\n", + "2019-01-31 00:50:35,020 : INFO : topic #7 (0.020): 0.020*\"di\" + 0.020*\"snatch\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 00:50:35,021 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.033*\"cotton\" + 0.027*\"area\" + 0.024*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:50:35,022 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.041*\"line\" + 0.034*\"arsen\" + 0.034*\"raid\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.013*\"oper\"\n", + "2019-01-31 00:50:35,027 : INFO : topic diff=0.004891, rho=0.031544\n", + "2019-01-31 00:50:35,186 : INFO : PROGRESS: pass 0, at document #2012000/4922894\n", + "2019-01-31 00:50:36,604 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:36,871 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:50:36,872 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.021*\"member\" + 0.017*\"serv\" + 0.017*\"gener\" + 0.016*\"start\" + 0.016*\"seri\"\n", + "2019-01-31 00:50:36,873 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:50:36,874 : INFO : topic #15 
(0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:50:36,875 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.025*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:50:36,881 : INFO : topic diff=0.005384, rho=0.031528\n", + "2019-01-31 00:50:37,092 : INFO : PROGRESS: pass 0, at document #2014000/4922894\n", + "2019-01-31 00:50:38,478 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:38,745 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.008*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:50:38,746 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.012*\"women\"\n", + "2019-01-31 00:50:38,747 : INFO : topic #13 (0.020): 0.028*\"sourc\" + 0.027*\"australia\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:50:38,748 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:50:38,749 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:50:38,755 : INFO : topic diff=0.005063, 
rho=0.031513\n", + "2019-01-31 00:50:38,914 : INFO : PROGRESS: pass 0, at document #2016000/4922894\n", + "2019-01-31 00:50:40,451 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:40,718 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"like\"\n", + "2019-01-31 00:50:40,719 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.013*\"women\"\n", + "2019-01-31 00:50:40,720 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"militari\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:50:40,721 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"replac\" + 0.008*\"princess\"\n", + "2019-01-31 00:50:40,722 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:50:40,728 : INFO : topic diff=0.004565, rho=0.031497\n", + "2019-01-31 00:50:40,888 : INFO : PROGRESS: pass 0, at document #2018000/4922894\n", + "2019-01-31 00:50:42,311 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:42,578 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.017*\"warmth\" + 0.016*\"area\" + 0.016*\"lagrang\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"land\" + 0.008*\"north\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 00:50:42,579 : INFO : topic #22 (0.020): 
0.034*\"spars\" + 0.024*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"hostil\" + 0.009*\"live\" + 0.008*\"biom\"\n", + "2019-01-31 00:50:42,580 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.042*\"canadian\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.021*\"hoar\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:50:42,581 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.034*\"raid\" + 0.033*\"arsen\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.013*\"oper\"\n", + "2019-01-31 00:50:42,582 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.019*\"com\" + 0.014*\"militari\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:50:42,588 : INFO : topic diff=0.004261, rho=0.031481\n", + "2019-01-31 00:50:45,312 : INFO : -11.609 per-word bound, 3124.1 perplexity estimate based on a held-out corpus of 2000 documents with 559192 words\n", + "2019-01-31 00:50:45,313 : INFO : PROGRESS: pass 0, at document #2020000/4922894\n", + "2019-01-31 00:50:46,717 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:46,983 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.039*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:50:46,984 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"exampl\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"method\" + 0.005*\"measur\"\n", + "2019-01-31 00:50:46,986 : INFO : topic #7 (0.020): 0.020*\"di\" + 0.020*\"snatch\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 
0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 00:50:46,987 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.019*\"mexico\" + 0.019*\"del\" + 0.015*\"soviet\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"lizard\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:50:46,988 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.031*\"jacksonvil\" + 0.022*\"japanes\" + 0.020*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:50:46,994 : INFO : topic diff=0.004643, rho=0.031466\n", + "2019-01-31 00:50:47,150 : INFO : PROGRESS: pass 0, at document #2022000/4922894\n", + "2019-01-31 00:50:48,545 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:48,812 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:50:48,813 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.030*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"count\" + 0.014*\"portugues\" + 0.012*\"brazil\"\n", + "2019-01-31 00:50:48,814 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:50:48,815 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"cancer\"\n", + "2019-01-31 00:50:48,816 : INFO : topic #35 (0.020): 0.058*\"russia\" + 
0.039*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:50:48,822 : INFO : topic diff=0.003888, rho=0.031450\n", + "2019-01-31 00:50:48,981 : INFO : PROGRESS: pass 0, at document #2024000/4922894\n", + "2019-01-31 00:50:50,381 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:50,647 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:50,648 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.013*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:50:50,650 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.010*\"market\" + 0.010*\"bank\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:50:50,651 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.012*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 00:50:50,652 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"spectacl\" + 0.006*\"produc\"\n", + "2019-01-31 00:50:50,658 : INFO : topic diff=0.005177, rho=0.031435\n", + "2019-01-31 00:50:50,812 : INFO : PROGRESS: pass 0, at document #2026000/4922894\n", + "2019-01-31 00:50:52,178 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:50:52,444 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.031*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:52,445 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.012*\"women\"\n", + "2019-01-31 00:50:52,447 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"liber\" + 0.014*\"republ\" + 0.014*\"conserv\" + 0.013*\"bypass\"\n", + "2019-01-31 00:50:52,448 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.013*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:50:52,449 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:50:52,455 : INFO : topic diff=0.004865, rho=0.031419\n", + "2019-01-31 00:50:52,608 : INFO : PROGRESS: pass 0, at document #2028000/4922894\n", + "2019-01-31 00:50:53,978 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:54,244 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.016*\"wind\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.012*\"turkish\" + 0.012*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:50:54,245 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"replac\" + 0.008*\"princess\"\n", + 
"2019-01-31 00:50:54,247 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.015*\"soviet\" + 0.012*\"carlo\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"josé\"\n", + "2019-01-31 00:50:54,247 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.072*\"juli\" + 0.071*\"april\" + 0.070*\"januari\" + 0.069*\"august\" + 0.069*\"notion\" + 0.069*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 00:50:54,249 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"anim\" + 0.006*\"appear\" + 0.005*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:50:54,254 : INFO : topic diff=0.004494, rho=0.031404\n", + "2019-01-31 00:50:54,410 : INFO : PROGRESS: pass 0, at document #2030000/4922894\n", + "2019-01-31 00:50:55,770 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:56,036 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:50:56,037 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:50:56,038 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.015*\"soviet\" + 0.012*\"juan\" + 0.012*\"carlo\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"josé\"\n", + "2019-01-31 00:50:56,039 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.046*\"popolo\" + 0.045*\"vigour\" + 0.038*\"tortur\" + 0.033*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:50:56,040 : INFO : topic #14 
(0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.014*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 00:50:56,046 : INFO : topic diff=0.004602, rho=0.031388\n", + "2019-01-31 00:50:56,201 : INFO : PROGRESS: pass 0, at document #2032000/4922894\n", + "2019-01-31 00:50:57,580 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:50:57,847 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.009*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:50:57,848 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:50:57,849 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 00:50:57,850 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:50:57,851 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"spectacl\" + 0.006*\"produc\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:50:57,857 : INFO : topic diff=0.005449, rho=0.031373\n", + "2019-01-31 00:50:58,012 : INFO : PROGRESS: pass 0, at document #2034000/4922894\n", + "2019-01-31 00:50:59,392 : INFO : merging changes from 2000 documents 
into a model of 4922894 documents\n", + "2019-01-31 00:50:59,659 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.026*\"taxpay\" + 0.026*\"scientist\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:50:59,660 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 00:50:59,661 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.039*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.021*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 00:50:59,662 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.031*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:50:59,663 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:50:59,669 : INFO : topic diff=0.005613, rho=0.031357\n", + "2019-01-31 00:50:59,827 : INFO : PROGRESS: pass 0, at document #2036000/4922894\n", + "2019-01-31 00:51:01,222 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:01,488 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\" + 0.010*\"strategist\"\n", + "2019-01-31 00:51:01,489 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 
0.014*\"portugues\" + 0.014*\"count\" + 0.012*\"brazil\"\n", + "2019-01-31 00:51:01,490 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.046*\"popolo\" + 0.045*\"vigour\" + 0.038*\"tortur\" + 0.033*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:51:01,491 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.014*\"conserv\" + 0.013*\"bypass\"\n", + "2019-01-31 00:51:01,492 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.012*\"ret\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 00:51:01,499 : INFO : topic diff=0.005632, rho=0.031342\n", + "2019-01-31 00:51:01,655 : INFO : PROGRESS: pass 0, at document #2038000/4922894\n", + "2019-01-31 00:51:03,010 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:03,276 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.024*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.017*\"retroflex\" + 0.017*\"sail\" + 0.011*\"cathedr\" + 0.010*\"centuri\" + 0.009*\"relationship\" + 0.009*\"poll\"\n", + "2019-01-31 00:51:03,277 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"israel\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.013*\"jewish\" + 0.012*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"isra\"\n", + "2019-01-31 00:51:03,279 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.008*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:51:03,280 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 
0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:51:03,281 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.031*\"new\" + 0.030*\"american\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:51:03,287 : INFO : topic diff=0.005952, rho=0.031327\n", + "2019-01-31 00:51:06,053 : INFO : -11.678 per-word bound, 3276.1 perplexity estimate based on a held-out corpus of 2000 documents with 596515 words\n", + "2019-01-31 00:51:06,054 : INFO : PROGRESS: pass 0, at document #2040000/4922894\n", + "2019-01-31 00:51:07,463 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:07,729 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:51:07,730 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:51:07,731 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.028*\"personifi\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:51:07,732 : INFO : topic #3 (0.020): 0.037*\"present\" + 0.027*\"minist\" + 0.026*\"offic\" + 0.021*\"nation\" + 0.021*\"member\" + 0.020*\"govern\" + 0.016*\"gener\" + 0.016*\"start\" + 0.016*\"serv\" + 0.015*\"seri\"\n", + "2019-01-31 00:51:07,733 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 
00:51:07,739 : INFO : topic diff=0.005178, rho=0.031311\n", + "2019-01-31 00:51:07,895 : INFO : PROGRESS: pass 0, at document #2042000/4922894\n", + "2019-01-31 00:51:09,279 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:09,545 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.039*\"line\" + 0.035*\"raid\" + 0.035*\"arsen\" + 0.027*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:51:09,546 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 00:51:09,547 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:51:09,548 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.015*\"soviet\" + 0.012*\"carlo\" + 0.012*\"juan\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"lizard\"\n", + "2019-01-31 00:51:09,549 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.021*\"ontario\" + 0.021*\"hoar\" + 0.019*\"colonist\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.013*\"misericordia\" + 0.013*\"novotná\"\n", + "2019-01-31 00:51:09,556 : INFO : topic diff=0.004144, rho=0.031296\n", + "2019-01-31 00:51:09,715 : INFO : PROGRESS: pass 0, at document #2044000/4922894\n", + "2019-01-31 00:51:11,122 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:11,388 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:51:11,389 
: INFO : topic #48 (0.020): 0.078*\"march\" + 0.076*\"sens\" + 0.076*\"octob\" + 0.071*\"juli\" + 0.069*\"notion\" + 0.069*\"januari\" + 0.068*\"judici\" + 0.068*\"april\" + 0.068*\"august\" + 0.067*\"decatur\"\n", + "2019-01-31 00:51:11,391 : INFO : topic #37 (0.020): 0.009*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"appear\" + 0.006*\"anim\" + 0.005*\"blue\" + 0.005*\"vision\"\n", + "2019-01-31 00:51:11,391 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.048*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 00:51:11,393 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"spectacl\" + 0.006*\"produc\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:51:11,398 : INFO : topic diff=0.004961, rho=0.031281\n", + "2019-01-31 00:51:11,558 : INFO : PROGRESS: pass 0, at document #2046000/4922894\n", + "2019-01-31 00:51:12,971 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:13,238 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\" + 0.010*\"strategist\"\n", + "2019-01-31 00:51:13,239 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"bank\" + 0.010*\"market\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:51:13,240 : INFO : topic #46 (0.020): 0.019*\"damag\" + 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.012*\"turkish\" + 
0.011*\"denmark\" + 0.011*\"ton\"\n", + "2019-01-31 00:51:13,241 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.007*\"cytokin\" + 0.007*\"includ\" + 0.007*\"ural\"\n", + "2019-01-31 00:51:13,242 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.031*\"unionist\" + 0.031*\"new\" + 0.030*\"american\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:51:13,248 : INFO : topic diff=0.004858, rho=0.031265\n", + "2019-01-31 00:51:13,464 : INFO : PROGRESS: pass 0, at document #2048000/4922894\n", + "2019-01-31 00:51:14,840 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:15,106 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.040*\"line\" + 0.035*\"raid\" + 0.034*\"arsen\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.013*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:51:15,107 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"spectacl\" + 0.007*\"encyclopedia\" + 0.006*\"produc\"\n", + "2019-01-31 00:51:15,109 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.018*\"retroflex\" + 0.016*\"sail\" + 0.010*\"cathedr\" + 0.010*\"centuri\" + 0.009*\"poll\" + 0.009*\"relationship\"\n", + "2019-01-31 00:51:15,110 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:51:15,111 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 
0.014*\"chamber\" + 0.014*\"taxpay\" + 0.012*\"defeat\"\n", + "2019-01-31 00:51:15,117 : INFO : topic diff=0.004943, rho=0.031250\n", + "2019-01-31 00:51:15,272 : INFO : PROGRESS: pass 0, at document #2050000/4922894\n", + "2019-01-31 00:51:16,645 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:16,911 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:51:16,912 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:51:16,914 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"hostil\" + 0.009*\"biom\" + 0.008*\"live\"\n", + "2019-01-31 00:51:16,915 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"spectacl\" + 0.006*\"produc\"\n", + "2019-01-31 00:51:16,916 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:51:16,922 : INFO : topic diff=0.004641, rho=0.031235\n", + "2019-01-31 00:51:17,075 : INFO : PROGRESS: pass 0, at document #2052000/4922894\n", + "2019-01-31 00:51:18,441 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:18,708 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" 
+ 0.008*\"english\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:51:18,709 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"carlo\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"italian\"\n", + "2019-01-31 00:51:18,710 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.012*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"brio\" + 0.007*\"diggin\" + 0.007*\"ural\" + 0.007*\"includ\"\n", + "2019-01-31 00:51:18,711 : INFO : topic #46 (0.020): 0.019*\"damag\" + 0.017*\"sweden\" + 0.017*\"stop\" + 0.017*\"swedish\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.012*\"turkish\" + 0.012*\"denmark\" + 0.011*\"danish\"\n", + "2019-01-31 00:51:18,712 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.040*\"line\" + 0.035*\"raid\" + 0.034*\"arsen\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.017*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:51:18,718 : INFO : topic diff=0.004776, rho=0.031220\n", + "2019-01-31 00:51:18,877 : INFO : PROGRESS: pass 0, at document #2054000/4922894\n", + "2019-01-31 00:51:20,263 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:20,530 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.012*\"denmark\" + 0.012*\"turkish\" + 0.012*\"danish\"\n", + "2019-01-31 00:51:20,531 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.076*\"octob\" + 0.076*\"sens\" + 0.071*\"juli\" + 0.070*\"januari\" + 0.070*\"notion\" + 0.068*\"april\" + 0.068*\"august\" + 0.068*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 00:51:20,532 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 
0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:51:20,533 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"brio\" + 0.007*\"ural\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 00:51:20,534 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"carlo\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"josé\"\n", + "2019-01-31 00:51:20,540 : INFO : topic diff=0.004122, rho=0.031204\n", + "2019-01-31 00:51:20,695 : INFO : PROGRESS: pass 0, at document #2056000/4922894\n", + "2019-01-31 00:51:22,077 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:22,344 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 00:51:22,345 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:51:22,346 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.007*\"ural\" + 0.007*\"user\" + 0.007*\"brio\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:51:22,347 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.031*\"new\" + 0.030*\"unionist\" + 0.030*\"american\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.016*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:51:22,348 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"squatter\" + 0.012*\"find\" + 0.011*\"théori\" + 0.011*\"ret\" + 
0.010*\"fool\"\n", + "2019-01-31 00:51:22,354 : INFO : topic diff=0.005014, rho=0.031189\n", + "2019-01-31 00:51:22,513 : INFO : PROGRESS: pass 0, at document #2058000/4922894\n", + "2019-01-31 00:51:23,908 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:51:24,174 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"wreath\" + 0.011*\"piec\"\n", + "2019-01-31 00:51:24,175 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.009*\"teufel\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"till\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 00:51:24,176 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.045*\"american\" + 0.026*\"valour\" + 0.018*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:51:24,177 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.031*\"new\" + 0.030*\"unionist\" + 0.030*\"american\" + 0.026*\"cotton\" + 0.018*\"year\" + 0.016*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:51:24,178 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:51:24,184 : INFO : topic diff=0.004734, rho=0.031174\n", + "2019-01-31 00:51:26,892 : INFO : -12.012 per-word bound, 4131.2 perplexity estimate based on a held-out corpus of 2000 documents with 573678 words\n", + "2019-01-31 00:51:26,892 : INFO : PROGRESS: pass 0, at document #2060000/4922894\n", + "2019-01-31 00:51:28,286 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:51:28,552 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 00:51:28,553 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"minist\" + 0.027*\"offic\" + 0.021*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.017*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:51:28,554 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.016*\"stop\" + 0.016*\"wind\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.012*\"danish\" + 0.012*\"denmark\" + 0.011*\"turkish\"\n", + "2019-01-31 00:51:28,555 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.020*\"ontario\" + 0.017*\"colonist\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.013*\"novotná\" + 0.013*\"misericordia\"\n", + "2019-01-31 00:51:28,557 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.005*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 00:51:28,562 : INFO : topic diff=0.005191, rho=0.031159\n", + "2019-01-31 00:51:28,722 : INFO : PROGRESS: pass 0, at document #2062000/4922894\n", + "2019-01-31 00:51:30,140 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:30,406 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.028*\"personifi\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.013*\"malaysia\"\n", + "2019-01-31 00:51:30,407 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 
0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:51:30,408 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.008*\"septemb\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"gestur\" + 0.006*\"anim\" + 0.006*\"appear\" + 0.005*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:51:30,409 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:51:30,410 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"western\" + 0.016*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"depress\" + 0.008*\"light\"\n", + "2019-01-31 00:51:30,416 : INFO : topic diff=0.004206, rho=0.031144\n", + "2019-01-31 00:51:30,572 : INFO : PROGRESS: pass 0, at document #2064000/4922894\n", + "2019-01-31 00:51:31,945 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:32,210 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.043*\"canadian\" + 0.021*\"toronto\" + 0.021*\"hoar\" + 0.020*\"ontario\" + 0.017*\"colonist\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.013*\"novotná\" + 0.013*\"misericordia\"\n", + "2019-01-31 00:51:32,211 : INFO : topic #3 (0.020): 0.036*\"present\" + 0.027*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.020*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.017*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:51:32,212 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"spectacl\" + 0.007*\"encyclopedia\" + 0.006*\"develop\"\n", + "2019-01-31 00:51:32,214 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 
0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:51:32,215 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.027*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"ireland\" + 0.018*\"british\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:51:32,221 : INFO : topic diff=0.005277, rho=0.031129\n", + "2019-01-31 00:51:32,376 : INFO : PROGRESS: pass 0, at document #2066000/4922894\n", + "2019-01-31 00:51:33,741 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:34,008 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.014*\"anglo\" + 0.014*\"islam\" + 0.013*\"televis\" + 0.013*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.010*\"affection\"\n", + "2019-01-31 00:51:34,009 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.020*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:51:34,010 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:51:34,011 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.065*\"best\" + 0.031*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.020*\"festiv\" + 0.019*\"noll\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:51:34,012 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.012*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:51:34,018 : INFO : topic diff=0.004418, rho=0.031114\n", + "2019-01-31 00:51:34,169 : INFO : PROGRESS: pass 0, at document #2068000/4922894\n", + "2019-01-31 
00:51:35,522 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:35,789 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.020*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:51:35,790 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.038*\"tortur\" + 0.034*\"cotton\" + 0.027*\"area\" + 0.023*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:51:35,791 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"hostil\" + 0.008*\"live\" + 0.008*\"western\"\n", + "2019-01-31 00:51:35,792 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:51:35,793 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:51:35,799 : INFO : topic diff=0.004478, rho=0.031099\n", + "2019-01-31 00:51:35,957 : INFO : PROGRESS: pass 0, at document #2070000/4922894\n", + "2019-01-31 00:51:37,338 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:51:37,604 : INFO : topic #20 (0.020): 0.147*\"scholar\" + 0.040*\"struggl\" + 0.036*\"high\" + 0.028*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"class\"\n", + "2019-01-31 00:51:37,605 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"damag\" + 
0.017*\"sweden\" + 0.016*\"wind\" + 0.016*\"swedish\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.011*\"turkish\" + 0.011*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 00:51:37,606 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.008*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:51:37,607 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 00:51:37,608 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.028*\"personifi\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:51:37,614 : INFO : topic diff=0.004602, rho=0.031083\n", + "2019-01-31 00:51:37,763 : INFO : PROGRESS: pass 0, at document #2072000/4922894\n", + "2019-01-31 00:51:39,102 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:39,369 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:51:39,370 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:51:39,371 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 00:51:39,371 : INFO : topic #1 (0.020): 0.055*\"china\" + 
0.050*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 00:51:39,373 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:51:39,378 : INFO : topic diff=0.004903, rho=0.031068\n", + "2019-01-31 00:51:39,535 : INFO : PROGRESS: pass 0, at document #2074000/4922894\n", + "2019-01-31 00:51:40,923 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:41,190 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.029*\"personifi\" + 0.026*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 00:51:41,191 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.019*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.008*\"justic\"\n", + "2019-01-31 00:51:41,192 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.043*\"american\" + 0.028*\"valour\" + 0.019*\"player\" + 0.018*\"folei\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:51:41,193 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.007*\"veget\" + 0.007*\"spectacl\" + 0.006*\"encyclopedia\" + 0.006*\"develop\"\n", + "2019-01-31 00:51:41,194 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.017*\"retroflex\" + 0.016*\"sail\" + 0.010*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"relationship\"\n", + "2019-01-31 00:51:41,200 : INFO : topic 
diff=0.005879, rho=0.031054\n", + "2019-01-31 00:51:41,357 : INFO : PROGRESS: pass 0, at document #2076000/4922894\n", + "2019-01-31 00:51:42,731 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:42,997 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"carlo\" + 0.012*\"francisco\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"italian\"\n", + "2019-01-31 00:51:42,998 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 00:51:42,999 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 00:51:43,000 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 00:51:43,002 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"sweden\" + 0.017*\"norwai\" + 0.017*\"stop\" + 0.016*\"swedish\" + 0.016*\"wind\" + 0.014*\"norwegian\" + 0.011*\"turkish\" + 0.011*\"denmark\" + 0.011*\"danish\"\n", + "2019-01-31 00:51:43,007 : INFO : topic diff=0.004777, rho=0.031039\n", + "2019-01-31 00:51:43,218 : INFO : PROGRESS: pass 0, at document #2078000/4922894\n", + "2019-01-31 00:51:44,580 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:44,847 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 
00:51:44,848 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"spectacl\" + 0.006*\"encyclopedia\" + 0.006*\"develop\"\n", + "2019-01-31 00:51:44,849 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.011*\"wreath\"\n", + "2019-01-31 00:51:44,850 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.031*\"rural\" + 0.029*\"personifi\" + 0.026*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"turin\"\n", + "2019-01-31 00:51:44,851 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:51:44,857 : INFO : topic diff=0.004845, rho=0.031024\n", + "2019-01-31 00:51:47,535 : INFO : -11.723 per-word bound, 3379.6 perplexity estimate based on a held-out corpus of 2000 documents with 550703 words\n", + "2019-01-31 00:51:47,536 : INFO : PROGRESS: pass 0, at document #2080000/4922894\n", + "2019-01-31 00:51:48,923 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:49,191 : INFO : topic #38 (0.020): 0.025*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"till\" + 0.007*\"armi\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:51:49,192 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.039*\"line\" + 0.035*\"raid\" + 0.035*\"arsen\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.014*\"pain\" + 0.013*\"rosenwald\" + 0.012*\"exhaust\"\n", + "2019-01-31 00:51:49,193 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.045*\"vigour\" + 
0.044*\"popolo\" + 0.037*\"tortur\" + 0.034*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.021*\"regim\" + 0.020*\"cede\"\n", + "2019-01-31 00:51:49,194 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:51:49,195 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:51:49,202 : INFO : topic diff=0.004875, rho=0.031009\n", + "2019-01-31 00:51:49,392 : INFO : PROGRESS: pass 0, at document #2082000/4922894\n", + "2019-01-31 00:51:50,750 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:51:51,015 : INFO : topic #32 (0.020): 0.057*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.034*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.021*\"regim\" + 0.020*\"cede\"\n", + "2019-01-31 00:51:51,016 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"taxpay\" + 0.019*\"candid\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.012*\"squatter\" + 0.012*\"théori\" + 0.011*\"find\" + 0.010*\"ret\"\n", + "2019-01-31 00:51:51,018 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:51:51,019 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.049*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 00:51:51,020 : INFO : topic 
#6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:51:51,026 : INFO : topic diff=0.005542, rho=0.030994\n", + "2019-01-31 00:51:51,187 : INFO : PROGRESS: pass 0, at document #2084000/4922894\n", + "2019-01-31 00:51:52,622 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:52,888 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.027*\"offic\" + 0.026*\"minist\" + 0.021*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.017*\"serv\" + 0.017*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:51:52,889 : INFO : topic #46 (0.020): 0.017*\"damag\" + 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.016*\"wind\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"turkish\" + 0.011*\"denmark\"\n", + "2019-01-31 00:51:52,890 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.007*\"softwar\" + 0.007*\"ural\" + 0.007*\"cytokin\" + 0.007*\"championship\"\n", + "2019-01-31 00:51:52,891 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.013*\"count\" + 0.012*\"kingdom\" + 0.012*\"portugues\"\n", + "2019-01-31 00:51:52,893 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.028*\"champion\" + 0.028*\"workplac\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.019*\"taxpay\" + 0.019*\"alic\"\n", + "2019-01-31 00:51:52,899 : INFO : topic diff=0.004858, rho=0.030979\n", + "2019-01-31 00:51:53,053 : INFO : PROGRESS: pass 0, at document #2086000/4922894\n", + "2019-01-31 00:51:54,423 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:51:54,689 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 00:51:54,690 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.049*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 00:51:54,692 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:51:54,693 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 00:51:54,694 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"francisco\" + 0.012*\"carlo\" + 0.011*\"lizard\" + 0.011*\"italian\" + 0.011*\"juan\"\n", + "2019-01-31 00:51:54,700 : INFO : topic diff=0.004670, rho=0.030964\n", + "2019-01-31 00:51:54,859 : INFO : PROGRESS: pass 0, at document #2088000/4922894\n", + "2019-01-31 00:51:56,260 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:56,526 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.016*\"colonist\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\"\n", + "2019-01-31 00:51:56,528 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.040*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"class\"\n", + 
"2019-01-31 00:51:56,529 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.043*\"american\" + 0.028*\"valour\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:51:56,530 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.020*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:51:56,531 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.025*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:51:56,537 : INFO : topic diff=0.005544, rho=0.030949\n", + "2019-01-31 00:51:56,695 : INFO : PROGRESS: pass 0, at document #2090000/4922894\n", + "2019-01-31 00:51:58,093 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:51:58,359 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.028*\"sourc\" + 0.026*\"new\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:51:58,360 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"brio\" + 0.007*\"user\" + 0.007*\"championship\" + 0.007*\"cytokin\" + 0.007*\"softwar\"\n", + "2019-01-31 00:51:58,362 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.020*\"champion\" + 0.016*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 00:51:58,363 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 
00:51:58,364 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:51:58,370 : INFO : topic diff=0.005200, rho=0.030934\n", + "2019-01-31 00:51:58,527 : INFO : PROGRESS: pass 0, at document #2092000/4922894\n", + "2019-01-31 00:51:59,915 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:00,182 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.011*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:52:00,183 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"black\" + 0.016*\"colder\" + 0.016*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.007*\"arm\"\n", + "2019-01-31 00:52:00,184 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"requir\" + 0.021*\"institut\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 00:52:00,185 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"brio\" + 0.008*\"championship\" + 0.007*\"cytokin\" + 0.007*\"softwar\" + 0.007*\"user\"\n", + "2019-01-31 00:52:00,186 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.050*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.016*\"leah\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 00:52:00,192 : INFO : topic diff=0.004904, rho=0.030920\n", + "2019-01-31 00:52:00,351 : INFO : PROGRESS: pass 0, at document #2094000/4922894\n", + "2019-01-31 00:52:01,745 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:52:02,012 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:52:02,014 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"brio\" + 0.008*\"cytokin\" + 0.007*\"user\" + 0.007*\"championship\" + 0.007*\"softwar\"\n", + "2019-01-31 00:52:02,015 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.065*\"best\" + 0.032*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.020*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:52:02,016 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.028*\"champion\" + 0.028*\"workplac\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.019*\"taxpay\"\n", + "2019-01-31 00:52:02,017 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 00:52:02,023 : INFO : topic diff=0.005287, rho=0.030905\n", + "2019-01-31 00:52:02,175 : INFO : PROGRESS: pass 0, at document #2096000/4922894\n", + "2019-01-31 00:52:03,536 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:03,803 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.014*\"islam\" + 0.014*\"anglo\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"affection\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.009*\"alam\"\n", + "2019-01-31 00:52:03,804 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.040*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 
0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"district\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:52:03,806 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"liber\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 00:52:03,807 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:52:03,808 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.043*\"american\" + 0.028*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:52:03,814 : INFO : topic diff=0.005021, rho=0.030890\n", + "2019-01-31 00:52:03,977 : INFO : PROGRESS: pass 0, at document #2098000/4922894\n", + "2019-01-31 00:52:05,405 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:05,671 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.027*\"personifi\" + 0.026*\"poison\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 00:52:05,672 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:52:05,673 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"colonist\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 00:52:05,675 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 
0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:52:05,676 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"brio\" + 0.008*\"cytokin\" + 0.007*\"user\" + 0.007*\"championship\" + 0.007*\"softwar\"\n", + "2019-01-31 00:52:05,681 : INFO : topic diff=0.005405, rho=0.030875\n", + "2019-01-31 00:52:08,311 : INFO : -11.540 per-word bound, 2978.5 perplexity estimate based on a held-out corpus of 2000 documents with 524481 words\n", + "2019-01-31 00:52:08,311 : INFO : PROGRESS: pass 0, at document #2100000/4922894\n", + "2019-01-31 00:52:10,020 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:10,288 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"black\" + 0.016*\"colder\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:52:10,290 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:52:10,291 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:52:10,292 : INFO : topic #48 (0.020): 0.078*\"march\" + 0.076*\"octob\" + 0.074*\"sens\" + 0.069*\"notion\" + 0.068*\"januari\" + 0.067*\"juli\" + 0.066*\"decatur\" + 0.066*\"august\" + 0.065*\"april\" + 0.065*\"judici\"\n", + "2019-01-31 00:52:10,293 : INFO : topic #32 (0.020): 0.055*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.037*\"tortur\" + 0.035*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.021*\"regim\" 
+ 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:52:10,299 : INFO : topic diff=0.005316, rho=0.030861\n", + "2019-01-31 00:52:10,459 : INFO : PROGRESS: pass 0, at document #2102000/4922894\n", + "2019-01-31 00:52:11,876 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:12,142 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:52:12,143 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.017*\"compos\" + 0.017*\"place\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"word\" + 0.011*\"physician\"\n", + "2019-01-31 00:52:12,144 : INFO : topic #9 (0.020): 0.080*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.010*\"simpler\"\n", + "2019-01-31 00:52:12,145 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"class\"\n", + "2019-01-31 00:52:12,146 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.011*\"francisco\" + 0.011*\"carlo\" + 0.011*\"lizard\" + 0.011*\"italian\" + 0.011*\"juan\"\n", + "2019-01-31 00:52:12,152 : INFO : topic diff=0.005163, rho=0.030846\n", + "2019-01-31 00:52:12,310 : INFO : PROGRESS: pass 0, at document #2104000/4922894\n", + "2019-01-31 00:52:14,205 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:14,472 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"requir\" + 0.021*\"institut\" + 0.019*\"student\" + 
0.015*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:52:14,473 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.049*\"chilton\" + 0.021*\"hong\" + 0.021*\"korea\" + 0.021*\"kong\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 00:52:14,474 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:52:14,475 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.011*\"diversifi\" + 0.011*\"airbu\"\n", + "2019-01-31 00:52:14,476 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"colonist\" + 0.014*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 00:52:14,482 : INFO : topic diff=0.004590, rho=0.030831\n", + "2019-01-31 00:52:14,635 : INFO : PROGRESS: pass 0, at document #2106000/4922894\n", + "2019-01-31 00:52:16,005 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:16,272 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:52:16,273 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.049*\"chilton\" + 0.022*\"korea\" + 0.021*\"hong\" + 0.021*\"kong\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 00:52:16,274 : INFO : topic #46 (0.020): 0.022*\"damag\" + 0.018*\"stop\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 
0.015*\"norwai\" + 0.015*\"wind\" + 0.013*\"norwegian\" + 0.013*\"ton\" + 0.011*\"farid\" + 0.011*\"turkish\"\n", + "2019-01-31 00:52:16,275 : INFO : topic #48 (0.020): 0.076*\"march\" + 0.076*\"octob\" + 0.074*\"sens\" + 0.068*\"notion\" + 0.067*\"januari\" + 0.066*\"juli\" + 0.065*\"decatur\" + 0.065*\"august\" + 0.064*\"april\" + 0.064*\"judici\"\n", + "2019-01-31 00:52:16,276 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:52:16,282 : INFO : topic diff=0.005471, rho=0.030817\n", + "2019-01-31 00:52:16,437 : INFO : PROGRESS: pass 0, at document #2108000/4922894\n", + "2019-01-31 00:52:17,815 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:18,081 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.009*\"septemb\" + 0.007*\"comic\" + 0.007*\"love\" + 0.006*\"anim\" + 0.006*\"gestur\" + 0.006*\"appear\" + 0.005*\"workplac\" + 0.005*\"vision\"\n", + "2019-01-31 00:52:18,082 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:52:18,083 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.008*\"median\"\n", + "2019-01-31 00:52:18,084 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.013*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.007*\"light\"\n", + "2019-01-31 00:52:18,085 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.039*\"line\" + 0.033*\"arsen\" + 0.033*\"raid\" + 0.026*\"museo\" + 
0.019*\"traceabl\" + 0.018*\"serv\" + 0.013*\"pain\" + 0.012*\"exhaust\" + 0.012*\"rosenwald\"\n", + "2019-01-31 00:52:18,091 : INFO : topic diff=0.005763, rho=0.030802\n", + "2019-01-31 00:52:18,300 : INFO : PROGRESS: pass 0, at document #2110000/4922894\n", + "2019-01-31 00:52:19,687 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:19,953 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:52:19,954 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.009*\"septemb\" + 0.007*\"comic\" + 0.007*\"love\" + 0.007*\"anim\" + 0.006*\"gestur\" + 0.006*\"appear\" + 0.005*\"workplac\" + 0.005*\"vision\"\n", + "2019-01-31 00:52:19,956 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:52:19,956 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"malaysia\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:52:19,957 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"centuri\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:52:19,963 : INFO : topic diff=0.004764, rho=0.030787\n", + "2019-01-31 00:52:20,118 : INFO : PROGRESS: pass 0, at document #2112000/4922894\n", + "2019-01-31 00:52:21,503 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:21,769 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" 
+ 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.015*\"liber\" + 0.013*\"seaport\" + 0.013*\"bypass\"\n", + "2019-01-31 00:52:21,770 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.031*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.027*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:52:21,771 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.009*\"charact\" + 0.009*\"septemb\" + 0.007*\"comic\" + 0.007*\"love\" + 0.007*\"anim\" + 0.006*\"gestur\" + 0.006*\"appear\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:52:21,772 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.012*\"champion\" + 0.012*\"fool\" + 0.011*\"théori\" + 0.011*\"ret\"\n", + "2019-01-31 00:52:21,774 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:52:21,779 : INFO : topic diff=0.004469, rho=0.030773\n", + "2019-01-31 00:52:21,944 : INFO : PROGRESS: pass 0, at document #2114000/4922894\n", + "2019-01-31 00:52:23,390 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:23,656 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:52:23,657 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:52:23,658 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.014*\"vol\" + 
0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:52:23,659 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.014*\"colonist\" + 0.013*\"novotná\"\n", + "2019-01-31 00:52:23,660 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.037*\"tortur\" + 0.034*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.021*\"regim\" + 0.020*\"cede\" + 0.020*\"citi\"\n", + "2019-01-31 00:52:23,666 : INFO : topic diff=0.006252, rho=0.030758\n", + "2019-01-31 00:52:23,820 : INFO : PROGRESS: pass 0, at document #2116000/4922894\n", + "2019-01-31 00:52:25,186 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:25,452 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:52:25,453 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"new\" + 0.014*\"colonist\" + 0.012*\"quebec\"\n", + "2019-01-31 00:52:25,454 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.032*\"priest\" + 0.021*\"rotterdam\" + 0.020*\"duke\" + 0.019*\"grammat\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"count\" + 0.014*\"kingdom\" + 0.012*\"portugues\"\n", + "2019-01-31 00:52:25,455 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"govern\" + 0.021*\"nation\" + 0.020*\"serv\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:52:25,456 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 
0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 00:52:25,462 : INFO : topic diff=0.004050, rho=0.030744\n", + "2019-01-31 00:52:25,622 : INFO : PROGRESS: pass 0, at document #2118000/4922894\n", + "2019-01-31 00:52:27,014 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:27,280 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"class\" + 0.008*\"fleet\"\n", + "2019-01-31 00:52:27,281 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:52:27,282 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.011*\"refut\" + 0.011*\"airbu\"\n", + "2019-01-31 00:52:27,283 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:52:27,284 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"nation\" + 0.021*\"govern\" + 0.020*\"serv\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:52:27,290 : INFO : topic diff=0.005558, rho=0.030729\n", + "2019-01-31 00:52:30,023 : INFO : -11.502 per-word bound, 2900.4 perplexity estimate based on a held-out corpus of 2000 documents with 560350 words\n", + "2019-01-31 00:52:30,023 : INFO : PROGRESS: pass 0, at document #2120000/4922894\n", + "2019-01-31 
00:52:31,429 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:31,695 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.031*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:52:31,696 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:52:31,698 : INFO : topic #13 (0.020): 0.028*\"new\" + 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:52:31,699 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:52:31,700 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.018*\"alic\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:52:31,706 : INFO : topic diff=0.004722, rho=0.030715\n", + "2019-01-31 00:52:31,867 : INFO : PROGRESS: pass 0, at document #2122000/4922894\n", + "2019-01-31 00:52:33,273 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:33,539 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 00:52:33,541 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 
0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.014*\"colonist\" + 0.012*\"quebec\"\n", + "2019-01-31 00:52:33,542 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.017*\"damn\" + 0.017*\"compos\" + 0.017*\"place\" + 0.015*\"orchestr\" + 0.012*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 00:52:33,543 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 00:52:33,544 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.011*\"hostil\" + 0.010*\"genu\" + 0.009*\"live\" + 0.009*\"median\"\n", + "2019-01-31 00:52:33,550 : INFO : topic diff=0.006739, rho=0.030700\n", + "2019-01-31 00:52:33,711 : INFO : PROGRESS: pass 0, at document #2124000/4922894\n", + "2019-01-31 00:52:35,129 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:35,396 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.066*\"best\" + 0.031*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"misconcept\"\n", + "2019-01-31 00:52:35,397 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:52:35,398 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"colonist\" + 0.013*\"quebec\"\n", + "2019-01-31 00:52:35,399 : INFO : topic #13 (0.020): 0.028*\"new\" + 0.027*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.023*\"england\" + 
0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:52:35,400 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:52:35,406 : INFO : topic diff=0.004119, rho=0.030686\n", + "2019-01-31 00:52:35,562 : INFO : PROGRESS: pass 0, at document #2126000/4922894\n", + "2019-01-31 00:52:36,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:37,206 : INFO : topic #29 (0.020): 0.027*\"companhia\" + 0.012*\"million\" + 0.011*\"busi\" + 0.010*\"produc\" + 0.010*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:52:37,208 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.008*\"battalion\" + 0.008*\"empath\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.006*\"pour\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 00:52:37,209 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.023*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"briarwood\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:52:37,210 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.010*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:52:37,211 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"epiru\" + 0.024*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:52:37,217 : INFO : topic diff=0.004646, rho=0.030671\n", + "2019-01-31 00:52:37,373 : INFO : PROGRESS: pass 0, at document #2128000/4922894\n", 
+ "2019-01-31 00:52:38,750 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:39,017 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.020*\"aggress\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"refut\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:52:39,018 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"liber\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 00:52:39,019 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 00:52:39,020 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.022*\"hong\" + 0.022*\"korea\" + 0.021*\"kong\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.016*\"leah\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 00:52:39,022 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 00:52:39,028 : INFO : topic diff=0.004411, rho=0.030657\n", + "2019-01-31 00:52:39,182 : INFO : PROGRESS: pass 0, at document #2130000/4922894\n", + "2019-01-31 00:52:40,560 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:40,827 : INFO : topic #20 (0.020): 0.148*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"district\"\n", + "2019-01-31 00:52:40,828 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"area\" + 0.016*\"mount\" + 
0.009*\"crayfish\" + 0.009*\"land\" + 0.009*\"palmer\" + 0.009*\"vacant\" + 0.008*\"north\"\n", + "2019-01-31 00:52:40,829 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"differ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:52:40,831 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.020*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"hostil\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"live\"\n", + "2019-01-31 00:52:40,832 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:52:40,838 : INFO : topic diff=0.005138, rho=0.030643\n", + "2019-01-31 00:52:40,993 : INFO : PROGRESS: pass 0, at document #2132000/4922894\n", + "2019-01-31 00:52:42,372 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:42,639 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 00:52:42,640 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.031*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:52:42,642 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.008*\"battalion\" + 0.008*\"empath\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:52:42,643 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 
0.011*\"busi\" + 0.011*\"produc\" + 0.010*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:52:42,644 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.013*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"like\"\n", + "2019-01-31 00:52:42,650 : INFO : topic diff=0.004653, rho=0.030628\n", + "2019-01-31 00:52:42,813 : INFO : PROGRESS: pass 0, at document #2134000/4922894\n", + "2019-01-31 00:52:44,245 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:44,511 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.023*\"hong\" + 0.022*\"korea\" + 0.022*\"kong\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.015*\"shirin\"\n", + "2019-01-31 00:52:44,513 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.032*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.012*\"rosenwald\"\n", + "2019-01-31 00:52:44,514 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.022*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:52:44,515 : INFO : topic #13 (0.020): 0.029*\"new\" + 0.027*\"sourc\" + 0.027*\"australia\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:52:44,517 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:52:44,522 : INFO : topic diff=0.005083, rho=0.030614\n", + "2019-01-31 00:52:44,679 : INFO : 
PROGRESS: pass 0, at document #2136000/4922894\n", + "2019-01-31 00:52:46,063 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:46,330 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 00:52:46,331 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:52:46,332 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:52:46,334 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:52:46,335 : INFO : topic #9 (0.020): 0.079*\"bone\" + 0.047*\"american\" + 0.027*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"dutch\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"surnam\"\n", + "2019-01-31 00:52:46,341 : INFO : topic diff=0.004378, rho=0.030600\n", + "2019-01-31 00:52:46,493 : INFO : PROGRESS: pass 0, at document #2138000/4922894\n", + "2019-01-31 00:52:47,872 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:48,139 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"italian\" + 0.011*\"santa\" + 0.011*\"lizard\"\n", + "2019-01-31 00:52:48,140 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" 
+ 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:52:48,141 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"serv\" + 0.021*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:52:48,142 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\"\n", + "2019-01-31 00:52:48,144 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:52:48,149 : INFO : topic diff=0.004352, rho=0.030585\n", + "2019-01-31 00:52:50,871 : INFO : -11.783 per-word bound, 3523.8 perplexity estimate based on a held-out corpus of 2000 documents with 552413 words\n", + "2019-01-31 00:52:50,872 : INFO : PROGRESS: pass 0, at document #2140000/4922894\n", + "2019-01-31 00:52:52,281 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:52,548 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:52:52,549 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:52:52,550 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.016*\"kim\" + 
0.014*\"shirin\"\n", + "2019-01-31 00:52:52,552 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 00:52:52,553 : INFO : topic #13 (0.020): 0.029*\"new\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:52:52,559 : INFO : topic diff=0.004782, rho=0.030571\n", + "2019-01-31 00:52:52,712 : INFO : PROGRESS: pass 0, at document #2142000/4922894\n", + "2019-01-31 00:52:54,076 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:54,343 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"servitud\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:52:54,344 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.014*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:52:54,345 : INFO : topic #13 (0.020): 0.028*\"new\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:52:54,346 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.025*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:52:54,348 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 
0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:52:54,354 : INFO : topic diff=0.005411, rho=0.030557\n", + "2019-01-31 00:52:54,574 : INFO : PROGRESS: pass 0, at document #2144000/4922894\n", + "2019-01-31 00:52:55,990 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:56,257 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:52:56,258 : INFO : topic #40 (0.020): 0.091*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"requir\" + 0.021*\"institut\" + 0.019*\"student\" + 0.016*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 00:52:56,259 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.016*\"western\" + 0.016*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.007*\"pain\"\n", + "2019-01-31 00:52:56,260 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.031*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.019*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 00:52:56,262 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.011*\"italian\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"francisco\"\n", + "2019-01-31 00:52:56,267 : INFO : topic diff=0.004642, rho=0.030542\n", + "2019-01-31 00:52:56,423 : INFO : PROGRESS: pass 0, at document #2146000/4922894\n", + "2019-01-31 00:52:57,803 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:58,069 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.022*\"rotterdam\" + 0.020*\"duke\" + 
0.019*\"grammat\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.014*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:52:58,070 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:52:58,071 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:52:58,072 : INFO : topic #46 (0.020): 0.019*\"damag\" + 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"turkish\" + 0.011*\"treeless\" + 0.011*\"farid\"\n", + "2019-01-31 00:52:58,074 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:52:58,080 : INFO : topic diff=0.004320, rho=0.030528\n", + "2019-01-31 00:52:58,235 : INFO : PROGRESS: pass 0, at document #2148000/4922894\n", + "2019-01-31 00:52:59,629 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:52:59,895 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"affection\" + 0.009*\"alam\" + 0.009*\"start\"\n", + "2019-01-31 00:52:59,896 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"produc\" + 0.010*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:52:59,897 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 
0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"poll\" + 0.009*\"relationship\" + 0.009*\"john\"\n", + "2019-01-31 00:52:59,899 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:52:59,900 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.017*\"martin\" + 0.015*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 00:52:59,906 : INFO : topic diff=0.003981, rho=0.030514\n", + "2019-01-31 00:53:00,062 : INFO : PROGRESS: pass 0, at document #2150000/4922894\n", + "2019-01-31 00:53:01,443 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:01,710 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"produc\" + 0.010*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:53:01,711 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.020*\"champion\" + 0.017*\"chamber\" + 0.016*\"martin\" + 0.016*\"tiepolo\" + 0.015*\"taxpay\" + 0.013*\"open\"\n", + "2019-01-31 00:53:01,712 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:53:01,713 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"serv\" + 0.021*\"govern\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:53:01,714 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 
0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:53:01,720 : INFO : topic diff=0.004137, rho=0.030500\n", + "2019-01-31 00:53:01,875 : INFO : PROGRESS: pass 0, at document #2152000/4922894\n", + "2019-01-31 00:53:03,256 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:03,522 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.031*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.019*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 00:53:03,523 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:53:03,525 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:53:03,526 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:53:03,527 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.042*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"hydrogen\" + 0.013*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 00:53:03,533 : INFO : topic diff=0.004978, rho=0.030486\n", + "2019-01-31 00:53:03,692 : INFO : PROGRESS: pass 0, at document #2154000/4922894\n", + "2019-01-31 00:53:05,092 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:05,357 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.042*\"canadian\" + 0.023*\"toronto\" + 
0.021*\"hoar\" + 0.019*\"ontario\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"hydrogen\" + 0.013*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 00:53:05,358 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:53:05,360 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:53:05,361 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.067*\"best\" + 0.031*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:53:05,362 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.021*\"serv\" + 0.021*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:53:05,368 : INFO : topic diff=0.005291, rho=0.030471\n", + "2019-01-31 00:53:05,529 : INFO : PROGRESS: pass 0, at document #2156000/4922894\n", + "2019-01-31 00:53:06,914 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:07,181 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.066*\"best\" + 0.031*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:53:07,182 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.025*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:53:07,183 : INFO : topic #36 (0.020): 
0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"brio\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"cytokin\"\n", + "2019-01-31 00:53:07,184 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.009*\"class\"\n", + "2019-01-31 00:53:07,185 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:53:07,191 : INFO : topic diff=0.004198, rho=0.030457\n", + "2019-01-31 00:53:07,355 : INFO : PROGRESS: pass 0, at document #2158000/4922894\n", + "2019-01-31 00:53:08,751 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:09,017 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.011*\"italian\" + 0.011*\"carlo\" + 0.011*\"santa\" + 0.011*\"lizard\"\n", + "2019-01-31 00:53:09,019 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.015*\"orchestr\" + 0.012*\"physician\" + 0.012*\"jack\" + 0.012*\"word\"\n", + "2019-01-31 00:53:09,020 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.013*\"seaport\" + 0.013*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 00:53:09,021 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.031*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"rosenwald\" + 0.012*\"exhaust\"\n", + "2019-01-31 00:53:09,022 : INFO : topic #48 (0.020): 
0.079*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.068*\"juli\" + 0.068*\"notion\" + 0.067*\"januari\" + 0.067*\"august\" + 0.066*\"judici\" + 0.065*\"april\" + 0.063*\"decatur\"\n", + "2019-01-31 00:53:09,028 : INFO : topic diff=0.003990, rho=0.030443\n", + "2019-01-31 00:53:11,702 : INFO : -11.803 per-word bound, 3573.1 perplexity estimate based on a held-out corpus of 2000 documents with 545454 words\n", + "2019-01-31 00:53:11,703 : INFO : PROGRESS: pass 0, at document #2160000/4922894\n", + "2019-01-31 00:53:13,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:13,354 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:53:13,355 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:53:13,357 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"ret\" + 0.013*\"squatter\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"champion\"\n", + "2019-01-31 00:53:13,358 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"area\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"vacant\" + 0.009*\"palmer\" + 0.008*\"crayfish\" + 0.008*\"land\"\n", + "2019-01-31 00:53:13,359 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.007*\"workplac\"\n", + "2019-01-31 00:53:13,365 : INFO : topic diff=0.004862, rho=0.030429\n", + "2019-01-31 00:53:13,528 : INFO : PROGRESS: pass 0, at document #2162000/4922894\n", + 
"2019-01-31 00:53:14,960 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:15,226 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"area\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"vacant\" + 0.009*\"palmer\" + 0.008*\"crayfish\" + 0.008*\"land\"\n", + "2019-01-31 00:53:15,227 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 00:53:15,229 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.021*\"nation\" + 0.021*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:53:15,230 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.031*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.014*\"pain\" + 0.013*\"exhaust\" + 0.013*\"rosenwald\"\n", + "2019-01-31 00:53:15,231 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 00:53:15,237 : INFO : topic diff=0.004586, rho=0.030415\n", + "2019-01-31 00:53:15,392 : INFO : PROGRESS: pass 0, at document #2164000/4922894\n", + "2019-01-31 00:53:16,780 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:17,046 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"district\" + 0.009*\"class\"\n", + "2019-01-31 00:53:17,047 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.028*\"incumb\" + 0.013*\"islam\" + 0.013*\"anglo\" + 
0.013*\"televis\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"singh\" + 0.010*\"affection\" + 0.009*\"alam\"\n", + "2019-01-31 00:53:17,049 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"brio\" + 0.007*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 00:53:17,050 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.031*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.014*\"pain\" + 0.013*\"rosenwald\" + 0.013*\"exhaust\"\n", + "2019-01-31 00:53:17,051 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.013*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:53:17,057 : INFO : topic diff=0.004641, rho=0.030401\n", + "2019-01-31 00:53:17,221 : INFO : PROGRESS: pass 0, at document #2166000/4922894\n", + "2019-01-31 00:53:18,637 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:18,903 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.007*\"anim\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:53:18,905 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.012*\"juan\" + 0.012*\"carlo\" + 0.011*\"santa\" + 0.011*\"italian\" + 0.011*\"lizard\"\n", + "2019-01-31 00:53:18,906 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.028*\"incumb\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.013*\"televis\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"affection\" + 0.010*\"singh\" + 0.010*\"start\"\n", + "2019-01-31 00:53:18,907 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"area\" + 
0.016*\"mount\" + 0.009*\"north\" + 0.009*\"vacant\" + 0.008*\"palmer\" + 0.008*\"crayfish\" + 0.008*\"land\"\n", + "2019-01-31 00:53:18,908 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.027*\"poison\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.020*\"poland\" + 0.019*\"moscow\" + 0.017*\"alexand\" + 0.015*\"tyrant\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:53:18,914 : INFO : topic diff=0.006502, rho=0.030387\n", + "2019-01-31 00:53:19,073 : INFO : PROGRESS: pass 0, at document #2168000/4922894\n", + "2019-01-31 00:53:20,467 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:20,733 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.021*\"champion\" + 0.020*\"tourist\" + 0.016*\"chamber\" + 0.016*\"martin\" + 0.016*\"tiepolo\" + 0.015*\"taxpay\" + 0.012*\"women\"\n", + "2019-01-31 00:53:20,735 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.017*\"colder\" + 0.017*\"illicit\" + 0.015*\"western\" + 0.015*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:53:20,736 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.075*\"octob\" + 0.068*\"juli\" + 0.068*\"januari\" + 0.068*\"notion\" + 0.067*\"august\" + 0.066*\"judici\" + 0.066*\"april\" + 0.063*\"decatur\"\n", + "2019-01-31 00:53:20,737 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:53:20,738 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.017*\"lagrang\" + 0.016*\"area\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"vacant\" + 0.008*\"palmer\" + 0.008*\"land\" + 0.008*\"crayfish\"\n", + "2019-01-31 00:53:20,744 : INFO : topic diff=0.004136, 
rho=0.030373\n", + "2019-01-31 00:53:20,902 : INFO : PROGRESS: pass 0, at document #2170000/4922894\n", + "2019-01-31 00:53:22,294 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:22,561 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:53:22,562 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:53:22,563 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.069*\"juli\" + 0.068*\"januari\" + 0.068*\"notion\" + 0.067*\"august\" + 0.066*\"judici\" + 0.066*\"april\" + 0.062*\"decatur\"\n", + "2019-01-31 00:53:22,564 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.032*\"priest\" + 0.022*\"duke\" + 0.021*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.013*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:53:22,565 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.031*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.013*\"pain\" + 0.013*\"exhaust\" + 0.013*\"rosenwald\"\n", + "2019-01-31 00:53:22,571 : INFO : topic diff=0.004951, rho=0.030359\n", + "2019-01-31 00:53:22,728 : INFO : PROGRESS: pass 0, at document #2172000/4922894\n", + "2019-01-31 00:53:24,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:24,411 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"turkish\" + 0.011*\"turkei\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:53:24,412 : INFO : topic 
#0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.034*\"arsen\" + 0.032*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.017*\"serv\" + 0.013*\"exhaust\" + 0.013*\"pain\" + 0.013*\"rosenwald\"\n", + "2019-01-31 00:53:24,413 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"western\" + 0.015*\"black\" + 0.013*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:53:24,415 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.032*\"priest\" + 0.022*\"duke\" + 0.021*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:53:24,416 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:53:24,422 : INFO : topic diff=0.004714, rho=0.030345\n", + "2019-01-31 00:53:24,634 : INFO : PROGRESS: pass 0, at document #2174000/4922894\n", + "2019-01-31 00:53:26,023 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:26,289 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:53:26,290 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.065*\"best\" + 0.031*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:53:26,292 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.047*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.016*\"dutch\" + 0.012*\"acrimoni\" + 0.011*\"surnam\"\n", + "2019-01-31 00:53:26,293 : INFO : topic #3 (0.020): 
0.033*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"serv\" + 0.020*\"member\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:53:26,294 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:53:26,300 : INFO : topic diff=0.005065, rho=0.030331\n", + "2019-01-31 00:53:26,456 : INFO : PROGRESS: pass 0, at document #2176000/4922894\n", + "2019-01-31 00:53:27,852 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:28,118 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"unionist\" + 0.014*\"militari\" + 0.014*\"oper\" + 0.012*\"airbu\" + 0.012*\"refut\"\n", + "2019-01-31 00:53:28,119 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"dutch\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 00:53:28,120 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.028*\"incumb\" + 0.013*\"islam\" + 0.013*\"televis\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"affection\" + 0.009*\"singh\"\n", + "2019-01-31 00:53:28,122 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:53:28,123 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.070*\"juli\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.067*\"august\" + 0.067*\"judici\" + 0.066*\"april\" + 0.063*\"decatur\"\n", + "2019-01-31 00:53:28,129 : INFO : topic diff=0.004624, rho=0.030317\n", + 
"2019-01-31 00:53:28,283 : INFO : PROGRESS: pass 0, at document #2178000/4922894\n", + "2019-01-31 00:53:29,652 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:29,919 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.007*\"comic\" + 0.007*\"love\" + 0.007*\"anim\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:53:29,920 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:53:29,922 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:53:29,923 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:53:29,924 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"italian\" + 0.012*\"juan\" + 0.012*\"carlo\" + 0.011*\"santa\" + 0.011*\"lizard\"\n", + "2019-01-31 00:53:29,930 : INFO : topic diff=0.004867, rho=0.030303\n", + "2019-01-31 00:53:32,656 : INFO : -11.674 per-word bound, 3268.0 perplexity estimate based on a held-out corpus of 2000 documents with 584163 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:53:32,657 : INFO : PROGRESS: pass 0, at document #2180000/4922894\n", + "2019-01-31 00:53:34,051 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:34,317 : INFO : topic #46 (0.020): 0.017*\"damag\" + 0.017*\"stop\" + 0.016*\"sweden\" + 
0.016*\"swedish\" + 0.016*\"norwai\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"turkish\" + 0.011*\"turkei\" + 0.011*\"farid\"\n", + "2019-01-31 00:53:34,319 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.017*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 00:53:34,320 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:53:34,321 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:53:34,323 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:53:34,329 : INFO : topic diff=0.004981, rho=0.030289\n", + "2019-01-31 00:53:34,488 : INFO : PROGRESS: pass 0, at document #2182000/4922894\n", + "2019-01-31 00:53:35,888 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:36,155 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.022*\"palmer\" + 0.014*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:53:36,156 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.011*\"champion\"\n", + "2019-01-31 00:53:36,158 : INFO : topic #28 (0.020): 0.030*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 
0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:53:36,159 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:53:36,160 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"spectacl\" + 0.006*\"develop\"\n", + "2019-01-31 00:53:36,166 : INFO : topic diff=0.004280, rho=0.030275\n", + "2019-01-31 00:53:36,325 : INFO : PROGRESS: pass 0, at document #2184000/4922894\n", + "2019-01-31 00:53:37,742 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:38,008 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:53:38,009 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.077*\"octob\" + 0.069*\"juli\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.068*\"august\" + 0.066*\"judici\" + 0.066*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 00:53:38,010 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.009*\"cathedr\" + 0.009*\"centuri\" + 0.009*\"relationship\" + 0.009*\"poll\"\n", + "2019-01-31 00:53:38,011 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:53:38,012 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 
0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:53:38,018 : INFO : topic diff=0.004740, rho=0.030261\n", + "2019-01-31 00:53:38,179 : INFO : PROGRESS: pass 0, at document #2186000/4922894\n", + "2019-01-31 00:53:39,604 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:39,870 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"damag\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"turkish\" + 0.011*\"turkei\" + 0.011*\"treeless\"\n", + "2019-01-31 00:53:39,871 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 00:53:39,872 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.024*\"london\" + 0.023*\"australian\" + 0.023*\"england\" + 0.020*\"ireland\" + 0.020*\"british\" + 0.015*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 00:53:39,873 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:53:39,874 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"soviet\" + 0.012*\"italian\" + 0.012*\"carlo\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\"\n", + "2019-01-31 00:53:39,880 : INFO : topic diff=0.004062, rho=0.030248\n", + "2019-01-31 00:53:40,036 : INFO : PROGRESS: pass 0, at document #2188000/4922894\n", + "2019-01-31 00:53:41,423 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:41,689 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.065*\"best\" + 
0.031*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:53:41,690 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"berlin\" + 0.014*\"jewish\" + 0.014*\"vol\" + 0.013*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:53:41,692 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:53:41,693 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"hostil\" + 0.010*\"genu\" + 0.008*\"median\" + 0.008*\"western\"\n", + "2019-01-31 00:53:41,694 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:53:41,699 : INFO : topic diff=0.004906, rho=0.030234\n", + "2019-01-31 00:53:41,859 : INFO : PROGRESS: pass 0, at document #2190000/4922894\n", + "2019-01-31 00:53:43,275 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:43,541 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.014*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:53:43,543 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.035*\"arsen\" + 0.031*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.013*\"pain\" + 0.013*\"exhaust\" + 0.013*\"rosenwald\"\n", + "2019-01-31 00:53:43,544 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.077*\"sens\" + 
0.077*\"octob\" + 0.070*\"juli\" + 0.070*\"judici\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.068*\"august\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 00:53:43,545 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.031*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.027*\"cotton\" + 0.020*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:53:43,546 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:53:43,551 : INFO : topic diff=0.004048, rho=0.030220\n", + "2019-01-31 00:53:43,707 : INFO : PROGRESS: pass 0, at document #2192000/4922894\n", + "2019-01-31 00:53:45,099 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:53:45,365 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"order\" + 0.009*\"polaris\" + 0.009*\"legal\"\n", + "2019-01-31 00:53:45,366 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"seaport\" + 0.014*\"republ\" + 0.013*\"liber\" + 0.013*\"bypass\"\n", + "2019-01-31 00:53:45,367 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"affection\" + 0.009*\"sri\"\n", + "2019-01-31 00:53:45,368 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.046*\"american\" + 0.026*\"valour\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.017*\"dutch\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 
00:53:45,369 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.011*\"champion\"\n", + "2019-01-31 00:53:45,375 : INFO : topic diff=0.004663, rho=0.030206\n", + "2019-01-31 00:53:45,530 : INFO : PROGRESS: pass 0, at document #2194000/4922894\n", + "2019-01-31 00:53:46,904 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:47,170 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.010*\"gothic\" + 0.009*\"district\"\n", + "2019-01-31 00:53:47,171 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.022*\"member\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.019*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:53:47,172 : INFO : topic #36 (0.020): 0.012*\"prognosi\" + 0.012*\"pop\" + 0.011*\"network\" + 0.008*\"championship\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"cytokin\" + 0.008*\"brio\" + 0.008*\"softwar\" + 0.008*\"user\"\n", + "2019-01-31 00:53:47,173 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.018*\"damag\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"turkish\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:53:47,174 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"market\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.007*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:53:47,180 : INFO : topic diff=0.004133, rho=0.030192\n", + "2019-01-31 00:53:47,341 : INFO : PROGRESS: pass 0, at document #2196000/4922894\n", + "2019-01-31 00:53:48,739 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:53:49,005 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:53:49,006 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.031*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:53:49,007 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:53:49,008 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:53:49,009 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:53:49,015 : INFO : topic diff=0.004337, rho=0.030179\n", + "2019-01-31 00:53:49,174 : INFO : PROGRESS: pass 0, at document #2198000/4922894\n", + "2019-01-31 00:53:50,699 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:50,965 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.041*\"line\" + 0.035*\"arsen\" + 0.032*\"raid\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.013*\"exhaust\" + 0.013*\"pain\" + 0.013*\"rosenwald\"\n", + "2019-01-31 00:53:50,966 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"hostil\" + 0.008*\"western\" + 
0.008*\"median\"\n", + "2019-01-31 00:53:50,967 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.080*\"march\" + 0.078*\"octob\" + 0.069*\"januari\" + 0.069*\"juli\" + 0.069*\"judici\" + 0.067*\"notion\" + 0.067*\"august\" + 0.066*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 00:53:50,968 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.033*\"priest\" + 0.022*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 00:53:50,970 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"class\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:53:50,976 : INFO : topic diff=0.004598, rho=0.030165\n", + "2019-01-31 00:53:53,754 : INFO : -11.540 per-word bound, 2978.0 perplexity estimate based on a held-out corpus of 2000 documents with 588492 words\n", + "2019-01-31 00:53:53,755 : INFO : PROGRESS: pass 0, at document #2200000/4922894\n", + "2019-01-31 00:53:55,174 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:55,440 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.064*\"best\" + 0.031*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:53:55,441 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"damag\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"treeless\" + 0.012*\"huntsvil\" + 0.012*\"turkish\"\n", + "2019-01-31 00:53:55,442 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.034*\"arsen\" + 0.032*\"raid\" + 0.026*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.013*\"exhaust\" + 0.013*\"pain\" + 0.013*\"rosenwald\"\n", + "2019-01-31 00:53:55,444 : INFO : topic #31 (0.020): 
0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:53:55,445 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.016*\"martin\" + 0.016*\"chamber\" + 0.015*\"tiepolo\" + 0.015*\"taxpay\" + 0.013*\"women\"\n", + "2019-01-31 00:53:55,451 : INFO : topic diff=0.005532, rho=0.030151\n", + "2019-01-31 00:53:55,608 : INFO : PROGRESS: pass 0, at document #2202000/4922894\n", + "2019-01-31 00:53:56,996 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:53:57,262 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 00:53:57,263 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.012*\"jack\"\n", + "2019-01-31 00:53:57,264 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.033*\"priest\" + 0.022*\"duke\" + 0.020*\"rotterdam\" + 0.020*\"grammat\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.014*\"portugues\" + 0.014*\"count\"\n", + "2019-01-31 00:53:57,265 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.013*\"televis\" + 0.013*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"affection\" + 0.010*\"khalsa\" + 0.009*\"sri\"\n", + "2019-01-31 00:53:57,266 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.025*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"order\" + 0.009*\"polaris\" + 0.009*\"legal\"\n", + "2019-01-31 00:53:57,272 : INFO : 
topic diff=0.003702, rho=0.030137\n", + "2019-01-31 00:53:57,429 : INFO : PROGRESS: pass 0, at document #2204000/4922894\n", + "2019-01-31 00:53:58,817 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:53:59,083 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:53:59,084 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.016*\"chamber\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.015*\"tiepolo\" + 0.013*\"women\"\n", + "2019-01-31 00:53:59,086 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:53:59,087 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.023*\"minist\" + 0.022*\"member\" + 0.022*\"nation\" + 0.022*\"govern\" + 0.018*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:53:59,088 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"briarwood\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:53:59,093 : INFO : topic diff=0.005275, rho=0.030124\n", + "2019-01-31 00:53:59,306 : INFO : PROGRESS: pass 0, at document #2206000/4922894\n", + "2019-01-31 00:54:00,710 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:00,975 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 
0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 00:54:00,976 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.006*\"have\" + 0.006*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:54:00,977 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:54:00,978 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.064*\"best\" + 0.032*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 00:54:00,980 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:54:00,985 : INFO : topic diff=0.004937, rho=0.030110\n", + "2019-01-31 00:54:01,145 : INFO : PROGRESS: pass 0, at document #2208000/4922894\n", + "2019-01-31 00:54:02,568 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:02,834 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:54:02,835 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:54:02,836 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.045*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.017*\"english\" + 
0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:54:02,837 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.007*\"comic\" + 0.007*\"anim\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"vision\"\n", + "2019-01-31 00:54:02,838 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.015*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 00:54:02,844 : INFO : topic diff=0.004893, rho=0.030096\n", + "2019-01-31 00:54:02,997 : INFO : PROGRESS: pass 0, at document #2210000/4922894\n", + "2019-01-31 00:54:04,369 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:04,636 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.007*\"southern\" + 0.006*\"servitud\" + 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"poet\" + 0.006*\"measur\"\n", + "2019-01-31 00:54:04,637 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"hostil\" + 0.009*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:54:04,638 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.048*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.033*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.022*\"regim\" + 0.020*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:54:04,639 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.011*\"champion\"\n", + "2019-01-31 00:54:04,640 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 
0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:54:04,647 : INFO : topic diff=0.004713, rho=0.030083\n", + "2019-01-31 00:54:04,803 : INFO : PROGRESS: pass 0, at document #2212000/4922894\n", + "2019-01-31 00:54:06,190 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:06,459 : INFO : topic #39 (0.020): 0.055*\"canada\" + 0.042*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"quebec\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.013*\"hydrogen\" + 0.012*\"novotná\"\n", + "2019-01-31 00:54:06,460 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:54:06,461 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.021*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:54:06,463 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:54:06,464 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.081*\"march\" + 0.078*\"octob\" + 0.070*\"juli\" + 0.070*\"januari\" + 0.069*\"judici\" + 0.068*\"august\" + 0.068*\"april\" + 0.068*\"notion\" + 0.065*\"decatur\"\n", + "2019-01-31 00:54:06,469 : INFO : topic diff=0.003931, rho=0.030069\n", + "2019-01-31 00:54:06,628 : INFO : PROGRESS: pass 0, at document #2214000/4922894\n", + "2019-01-31 00:54:08,018 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:08,285 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.015*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" 
+ 0.011*\"squatter\" + 0.011*\"fool\" + 0.011*\"champion\"\n", + "2019-01-31 00:54:08,286 : INFO : topic #37 (0.020): 0.010*\"man\" + 0.010*\"charact\" + 0.009*\"septemb\" + 0.008*\"anim\" + 0.007*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:54:08,287 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:54:08,288 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.019*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"hostil\" + 0.009*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:54:08,289 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.013*\"italian\" + 0.013*\"santa\" + 0.011*\"carlo\" + 0.011*\"lizard\" + 0.011*\"juan\"\n", + "2019-01-31 00:54:08,295 : INFO : topic diff=0.004119, rho=0.030056\n", + "2019-01-31 00:54:08,449 : INFO : PROGRESS: pass 0, at document #2216000/4922894\n", + "2019-01-31 00:54:09,827 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:10,093 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.032*\"high\" + 0.031*\"educ\" + 0.025*\"collector\" + 0.019*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:54:10,094 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.027*\"champion\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.023*\"alic\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:54:10,095 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.008*\"develop\" + 
0.008*\"user\" + 0.008*\"brio\" + 0.008*\"championship\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"cytokin\"\n", + "2019-01-31 00:54:10,096 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.017*\"martin\" + 0.016*\"tiepolo\" + 0.016*\"chamber\" + 0.015*\"taxpay\" + 0.013*\"women\"\n", + "2019-01-31 00:54:10,097 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 00:54:10,103 : INFO : topic diff=0.004368, rho=0.030042\n", + "2019-01-31 00:54:10,256 : INFO : PROGRESS: pass 0, at document #2218000/4922894\n", + "2019-01-31 00:54:11,616 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:11,882 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:54:11,883 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.047*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.033*\"cotton\" + 0.026*\"area\" + 0.021*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:54:11,885 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:54:11,886 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:54:11,887 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"new\" + 0.021*\"palmer\" + 0.014*\"strategist\" + 
0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:54:11,892 : INFO : topic diff=0.004403, rho=0.030029\n", + "2019-01-31 00:54:14,610 : INFO : -11.630 per-word bound, 3169.8 perplexity estimate based on a held-out corpus of 2000 documents with 531243 words\n", + "2019-01-31 00:54:14,610 : INFO : PROGRESS: pass 0, at document #2220000/4922894\n", + "2019-01-31 00:54:16,023 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:16,289 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:54:16,290 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.042*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.019*\"ontario\" + 0.016*\"misericordia\" + 0.015*\"quebec\" + 0.015*\"new\" + 0.014*\"hydrogen\" + 0.012*\"novotná\"\n", + "2019-01-31 00:54:16,291 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 00:54:16,292 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.022*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:54:16,293 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:54:16,299 : INFO : topic diff=0.003956, rho=0.030015\n", + "2019-01-31 00:54:16,462 : INFO : PROGRESS: pass 0, at document #2222000/4922894\n", + "2019-01-31 00:54:17,905 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:18,172 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.014*\"briarwood\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:54:18,173 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.022*\"tourist\" + 0.020*\"champion\" + 0.016*\"martin\" + 0.016*\"tiepolo\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 00:54:18,174 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.038*\"tortur\" + 0.034*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.021*\"regim\" + 0.021*\"citi\" + 0.020*\"cede\"\n", + "2019-01-31 00:54:18,175 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"pour\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 00:54:18,176 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.065*\"best\" + 0.032*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.017*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:54:18,181 : INFO : topic diff=0.005332, rho=0.030002\n", + "2019-01-31 00:54:18,342 : INFO : PROGRESS: pass 0, at document #2224000/4922894\n", + "2019-01-31 00:54:19,750 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:20,020 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.025*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:54:20,021 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.033*\"priest\" + 0.021*\"duke\" + 0.019*\"grammat\" + 0.019*\"rotterdam\" + 0.017*\"idiosyncrat\" + 
0.017*\"quarterli\" + 0.015*\"kingdom\" + 0.014*\"portugues\" + 0.014*\"count\"\n", + "2019-01-31 00:54:20,022 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:54:20,023 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"poet\" + 0.006*\"utopian\"\n", + "2019-01-31 00:54:20,024 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.012*\"poll\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"centuri\"\n", + "2019-01-31 00:54:20,030 : INFO : topic diff=0.005297, rho=0.029988\n", + "2019-01-31 00:54:20,192 : INFO : PROGRESS: pass 0, at document #2226000/4922894\n", + "2019-01-31 00:54:21,597 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:21,863 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"woman\" + 0.006*\"human\"\n", + "2019-01-31 00:54:21,864 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.016*\"ret\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.011*\"champion\"\n", + "2019-01-31 00:54:21,865 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"pour\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 00:54:21,866 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.022*\"tourist\" + 0.020*\"champion\" + 0.016*\"martin\" + 
0.016*\"chamber\" + 0.016*\"tiepolo\" + 0.015*\"taxpay\" + 0.013*\"women\"\n", + "2019-01-31 00:54:21,867 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.022*\"member\" + 0.022*\"govern\" + 0.022*\"nation\" + 0.019*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:54:21,873 : INFO : topic diff=0.005691, rho=0.029975\n", + "2019-01-31 00:54:22,029 : INFO : PROGRESS: pass 0, at document #2228000/4922894\n", + "2019-01-31 00:54:23,417 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:23,683 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"refut\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:54:23,684 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.045*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:54:23,685 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.008*\"anim\" + 0.007*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:54:23,686 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:54:23,687 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.020*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:54:23,693 : INFO : topic diff=0.004230, rho=0.029961\n", + "2019-01-31 00:54:23,850 : INFO : 
PROGRESS: pass 0, at document #2230000/4922894\n", + "2019-01-31 00:54:25,234 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:25,500 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.010*\"develop\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.006*\"human\"\n", + "2019-01-31 00:54:25,501 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"refut\" + 0.011*\"airbu\"\n", + "2019-01-31 00:54:25,502 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.034*\"priest\" + 0.023*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.014*\"count\" + 0.014*\"portugues\"\n", + "2019-01-31 00:54:25,503 : INFO : topic #46 (0.020): 0.019*\"stop\" + 0.016*\"damag\" + 0.016*\"norwai\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.013*\"treeless\" + 0.012*\"turkish\" + 0.012*\"denmark\"\n", + "2019-01-31 00:54:25,504 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.014*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"lobe\" + 0.008*\"land\"\n", + "2019-01-31 00:54:25,510 : INFO : topic diff=0.004679, rho=0.029948\n", + "2019-01-31 00:54:25,669 : INFO : PROGRESS: pass 0, at document #2232000/4922894\n", + "2019-01-31 00:54:27,079 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:27,345 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.019*\"adulthood\" + 0.014*\"feel\" + 0.013*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"hostil\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:54:27,346 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 
0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"refut\" + 0.011*\"airbu\"\n", + "2019-01-31 00:54:27,347 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.015*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.011*\"champion\"\n", + "2019-01-31 00:54:27,348 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:54:27,349 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.022*\"member\" + 0.022*\"nation\" + 0.022*\"govern\" + 0.019*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:54:27,355 : INFO : topic diff=0.004707, rho=0.029934\n", + "2019-01-31 00:54:27,516 : INFO : PROGRESS: pass 0, at document #2234000/4922894\n", + "2019-01-31 00:54:28,908 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:29,177 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.013*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 00:54:29,178 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"refut\" + 0.011*\"airbu\"\n", + "2019-01-31 00:54:29,179 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:54:29,180 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.032*\"germani\" + 0.015*\"berlin\" + 0.015*\"vol\" 
+ 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.012*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:54:29,181 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:54:29,187 : INFO : topic diff=0.005543, rho=0.029921\n", + "2019-01-31 00:54:29,345 : INFO : PROGRESS: pass 0, at document #2236000/4922894\n", + "2019-01-31 00:54:30,744 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:31,010 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.028*\"champion\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:54:31,012 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.010*\"reconstruct\"\n", + "2019-01-31 00:54:31,012 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.035*\"priest\" + 0.023*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.014*\"count\" + 0.014*\"portugues\"\n", + "2019-01-31 00:54:31,014 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:54:31,015 : INFO : topic #34 (0.020): 0.071*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:54:31,020 : INFO : topic diff=0.004682, rho=0.029907\n", + "2019-01-31 00:54:31,173 : INFO : PROGRESS: pass 0, at document 
#2238000/4922894\n", + "2019-01-31 00:54:32,603 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:32,871 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.020*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:54:32,872 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.013*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n", + "2019-01-31 00:54:32,873 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.011*\"market\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:54:32,874 : INFO : topic #34 (0.020): 0.070*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:54:32,875 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.052*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"report\" + 0.014*\"seaport\" + 0.013*\"liber\"\n", + "2019-01-31 00:54:32,882 : INFO : topic diff=0.005081, rho=0.029894\n", + "2019-01-31 00:54:35,627 : INFO : -11.822 per-word bound, 3619.9 perplexity estimate based on a held-out corpus of 2000 documents with 544971 words\n", + "2019-01-31 00:54:35,628 : INFO : PROGRESS: pass 0, at document #2240000/4922894\n", + "2019-01-31 00:54:37,007 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:37,273 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"briarwood\" + 0.013*\"histor\" + 0.011*\"strategist\" + 
0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:54:37,274 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.046*\"american\" + 0.025*\"valour\" + 0.019*\"player\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:54:37,275 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:54:37,276 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.023*\"cortic\" + 0.018*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"order\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\"\n", + "2019-01-31 00:54:37,277 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.011*\"market\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:54:37,283 : INFO : topic diff=0.004726, rho=0.029881\n", + "2019-01-31 00:54:37,439 : INFO : PROGRESS: pass 0, at document #2242000/4922894\n", + "2019-01-31 00:54:38,818 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:39,084 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 00:54:39,085 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.047*\"american\" + 0.025*\"valour\" + 0.019*\"player\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:54:39,087 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.015*\"berlin\" + 0.015*\"vol\" 
+ 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:54:39,088 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.035*\"priest\" + 0.022*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:54:39,089 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 00:54:39,095 : INFO : topic diff=0.004676, rho=0.029867\n", + "2019-01-31 00:54:39,249 : INFO : PROGRESS: pass 0, at document #2244000/4922894\n", + "2019-01-31 00:54:40,619 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:40,885 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"ret\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"squatter\" + 0.011*\"find\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:54:40,887 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.036*\"priest\" + 0.022*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:54:40,888 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:54:40,889 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.008*\"vernon\"\n", + "2019-01-31 00:54:40,890 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 
0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 00:54:40,896 : INFO : topic diff=0.004133, rho=0.029854\n", + "2019-01-31 00:54:41,051 : INFO : PROGRESS: pass 0, at document #2246000/4922894\n", + "2019-01-31 00:54:42,424 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:42,691 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 00:54:42,692 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.011*\"poll\" + 0.010*\"cathedr\" + 0.010*\"relationship\" + 0.010*\"centuri\"\n", + "2019-01-31 00:54:42,693 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.034*\"cotton\" + 0.026*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.021*\"regim\" + 0.020*\"cede\"\n", + "2019-01-31 00:54:42,694 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.013*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:54:42,695 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.034*\"raid\" + 0.033*\"arsen\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"rosenwald\" + 0.013*\"exhaust\" + 0.013*\"pain\"\n", + "2019-01-31 00:54:42,701 : INFO : topic diff=0.004573, rho=0.029841\n", + "2019-01-31 00:54:42,855 : INFO : PROGRESS: pass 0, at document #2248000/4922894\n", + "2019-01-31 00:54:44,222 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:44,488 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 
0.041*\"line\" + 0.034*\"arsen\" + 0.034*\"raid\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.013*\"rosenwald\" + 0.013*\"exhaust\" + 0.013*\"pain\"\n", + "2019-01-31 00:54:44,489 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:54:44,490 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.017*\"alexand\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:54:44,491 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:54:44,492 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.052*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"conserv\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.013*\"labour\"\n", + "2019-01-31 00:54:44,498 : INFO : topic diff=0.004308, rho=0.029827\n", + "2019-01-31 00:54:44,649 : INFO : PROGRESS: pass 0, at document #2250000/4922894\n", + "2019-01-31 00:54:46,002 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:46,268 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.052*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"conserv\" + 0.014*\"liber\" + 0.014*\"republ\" + 0.013*\"seaport\"\n", + "2019-01-31 00:54:46,269 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.022*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:54:46,270 : INFO : topic #33 (0.020): 
0.065*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:54:46,272 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:54:46,273 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.080*\"march\" + 0.079*\"octob\" + 0.071*\"januari\" + 0.070*\"juli\" + 0.068*\"judici\" + 0.068*\"notion\" + 0.067*\"april\" + 0.067*\"august\" + 0.065*\"decatur\"\n", + "2019-01-31 00:54:46,279 : INFO : topic diff=0.004911, rho=0.029814\n", + "2019-01-31 00:54:46,434 : INFO : PROGRESS: pass 0, at document #2252000/4922894\n", + "2019-01-31 00:54:47,810 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:48,077 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:54:48,078 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.025*\"epiru\" + 0.023*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:54:48,079 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.009*\"legal\"\n", + "2019-01-31 00:54:48,080 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.065*\"best\" + 0.032*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.015*\"winner\"\n", + "2019-01-31 
00:54:48,081 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.080*\"march\" + 0.079*\"octob\" + 0.071*\"januari\" + 0.070*\"juli\" + 0.068*\"judici\" + 0.068*\"notion\" + 0.067*\"april\" + 0.067*\"august\" + 0.066*\"decatur\"\n", + "2019-01-31 00:54:48,087 : INFO : topic diff=0.005261, rho=0.029801\n", + "2019-01-31 00:54:48,242 : INFO : PROGRESS: pass 0, at document #2254000/4922894\n", + "2019-01-31 00:54:49,607 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:49,873 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.022*\"factor\" + 0.018*\"adulthood\" + 0.014*\"feel\" + 0.012*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"hostil\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:54:49,874 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.015*\"winner\"\n", + "2019-01-31 00:54:49,875 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"ret\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 00:54:49,876 : INFO : topic #1 (0.020): 0.059*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.020*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.012*\"shirin\" + 0.012*\"ashvil\"\n", + "2019-01-31 00:54:49,877 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.028*\"workplac\" + 0.027*\"champion\" + 0.027*\"men\" + 0.025*\"olymp\" + 0.023*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:54:49,883 : INFO : topic diff=0.004541, rho=0.029788\n", + "2019-01-31 00:54:50,044 : INFO : PROGRESS: pass 0, at document #2256000/4922894\n", + "2019-01-31 00:54:51,446 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 00:54:51,713 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"utopian\" + 0.006*\"gener\" + 0.006*\"poet\"\n", + "2019-01-31 00:54:51,714 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"vernon\"\n", + "2019-01-31 00:54:51,715 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.034*\"priest\" + 0.021*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.014*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 00:54:51,716 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:54:51,717 : INFO : topic #29 (0.020): 0.028*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"produc\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:54:51,723 : INFO : topic diff=0.005600, rho=0.029775\n", + "2019-01-31 00:54:51,880 : INFO : PROGRESS: pass 0, at document #2258000/4922894\n", + "2019-01-31 00:54:53,252 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:53,519 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.023*\"minist\" + 0.022*\"serv\" + 0.022*\"member\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:54:53,520 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 
0.006*\"produc\"\n", + "2019-01-31 00:54:53,521 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"cultur\"\n", + "2019-01-31 00:54:53,522 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.052*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"liber\" + 0.014*\"conserv\" + 0.014*\"republ\" + 0.013*\"seaport\"\n", + "2019-01-31 00:54:53,523 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.013*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:54:53,529 : INFO : topic diff=0.004321, rho=0.029761\n", + "2019-01-31 00:54:56,215 : INFO : -11.817 per-word bound, 3609.1 perplexity estimate based on a held-out corpus of 2000 documents with 550496 words\n", + "2019-01-31 00:54:56,215 : INFO : PROGRESS: pass 0, at document #2260000/4922894\n", + "2019-01-31 00:54:57,600 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:57,866 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.016*\"chamber\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 00:54:57,867 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:54:57,868 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"lobe\" + 0.008*\"foam\" + 0.008*\"land\"\n", + "2019-01-31 00:54:57,869 : INFO : topic #18 (0.020): 0.010*\"théori\" + 
0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:54:57,870 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.034*\"cotton\" + 0.026*\"area\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.021*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:54:57,876 : INFO : topic diff=0.004881, rho=0.029748\n", + "2019-01-31 00:54:58,032 : INFO : PROGRESS: pass 0, at document #2262000/4922894\n", + "2019-01-31 00:54:59,412 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:54:59,678 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.027*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:54:59,679 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.016*\"chamber\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 00:54:59,680 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 00:54:59,681 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:54:59,683 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:54:59,688 : INFO : topic diff=0.004998, rho=0.029735\n", + "2019-01-31 00:54:59,843 : INFO : PROGRESS: 
pass 0, at document #2264000/4922894\n", + "2019-01-31 00:55:01,195 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:01,462 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.011*\"storag\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:55:01,463 : INFO : topic #36 (0.020): 0.012*\"pop\" + 0.011*\"network\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"brio\" + 0.008*\"diggin\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.007*\"championship\"\n", + "2019-01-31 00:55:01,464 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.013*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:55:01,465 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.016*\"chamber\" + 0.016*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.012*\"women\"\n", + "2019-01-31 00:55:01,466 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:55:01,472 : INFO : topic diff=0.004950, rho=0.029722\n", + "2019-01-31 00:55:01,627 : INFO : PROGRESS: pass 0, at document #2266000/4922894\n", + "2019-01-31 00:55:03,004 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:03,270 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.014*\"seaport\" + 0.013*\"bypass\"\n", + "2019-01-31 
00:55:03,271 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"foam\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 00:55:03,272 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.009*\"legal\"\n", + "2019-01-31 00:55:03,273 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.027*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.016*\"alexand\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:55:03,274 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.028*\"workplac\" + 0.026*\"champion\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.022*\"alic\" + 0.021*\"event\" + 0.021*\"medal\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:55:03,280 : INFO : topic diff=0.004497, rho=0.029709\n", + "2019-01-31 00:55:03,431 : INFO : PROGRESS: pass 0, at document #2268000/4922894\n", + "2019-01-31 00:55:04,780 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:05,047 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"new\" + 0.023*\"palmer\" + 0.013*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.010*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:55:05,048 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.013*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 00:55:05,049 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"measur\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"poet\"\n", + "2019-01-31 00:55:05,050 : INFO : topic 
#22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.018*\"adulthood\" + 0.015*\"feel\" + 0.013*\"male\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"hostil\" + 0.008*\"live\" + 0.008*\"western\"\n", + "2019-01-31 00:55:05,051 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"order\"\n", + "2019-01-31 00:55:05,057 : INFO : topic diff=0.004598, rho=0.029696\n", + "2019-01-31 00:55:05,271 : INFO : PROGRESS: pass 0, at document #2270000/4922894\n", + "2019-01-31 00:55:06,671 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:06,938 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.007*\"anim\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:55:06,939 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:55:06,940 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.080*\"march\" + 0.080*\"octob\" + 0.072*\"januari\" + 0.069*\"notion\" + 0.069*\"juli\" + 0.067*\"april\" + 0.067*\"judici\" + 0.066*\"decatur\" + 0.066*\"august\"\n", + "2019-01-31 00:55:06,941 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.034*\"priest\" + 0.021*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.014*\"count\" + 0.014*\"kingdom\" + 0.013*\"maria\"\n", + "2019-01-31 00:55:06,942 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"taxpay\" + 0.019*\"candid\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:55:06,949 : INFO : topic diff=0.004482, 
rho=0.029683\n", + "2019-01-31 00:55:07,107 : INFO : PROGRESS: pass 0, at document #2272000/4922894\n", + "2019-01-31 00:55:08,506 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:08,773 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:55:08,774 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.010*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 00:55:08,775 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.034*\"raid\" + 0.033*\"arsen\" + 0.027*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.013*\"rosenwald\" + 0.013*\"exhaust\" + 0.012*\"pain\"\n", + "2019-01-31 00:55:08,776 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 00:55:08,777 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.027*\"workplac\" + 0.026*\"champion\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.021*\"event\" + 0.020*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:55:08,783 : INFO : topic diff=0.005570, rho=0.029670\n", + "2019-01-31 00:55:08,942 : INFO : PROGRESS: pass 0, at document #2274000/4922894\n", + "2019-01-31 00:55:10,338 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:10,605 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"measur\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"poet\"\n", + "2019-01-31 
00:55:10,606 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.022*\"member\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.021*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:55:10,607 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:55:10,608 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.011*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.009*\"order\"\n", + "2019-01-31 00:55:10,609 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.014*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:55:10,615 : INFO : topic diff=0.004688, rho=0.029656\n", + "2019-01-31 00:55:10,773 : INFO : PROGRESS: pass 0, at document #2276000/4922894\n", + "2019-01-31 00:55:12,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:12,410 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.022*\"member\" + 0.022*\"nation\" + 0.021*\"govern\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:55:12,411 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 00:55:12,412 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"armi\" + 0.021*\"aggress\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:55:12,413 : INFO : 
topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:55:12,414 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:55:12,420 : INFO : topic diff=0.005100, rho=0.029643\n", + "2019-01-31 00:55:12,579 : INFO : PROGRESS: pass 0, at document #2278000/4922894\n", + "2019-01-31 00:55:13,974 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:14,240 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.018*\"stop\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.013*\"farid\" + 0.012*\"treeless\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:55:14,241 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.007*\"love\" + 0.007*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:55:14,243 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.014*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:55:14,244 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.011*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:55:14,245 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 
0.012*\"daughter\"\n", + "2019-01-31 00:55:14,251 : INFO : topic diff=0.004832, rho=0.029630\n", + "2019-01-31 00:55:16,914 : INFO : -11.637 per-word bound, 3185.9 perplexity estimate based on a held-out corpus of 2000 documents with 541085 words\n", + "2019-01-31 00:55:16,915 : INFO : PROGRESS: pass 0, at document #2280000/4922894\n", + "2019-01-31 00:55:18,287 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:18,553 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:55:18,554 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"vernon\"\n", + "2019-01-31 00:55:18,555 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.012*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:55:18,557 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.017*\"alexand\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:55:18,558 : INFO : topic #36 (0.020): 0.012*\"pop\" + 0.011*\"network\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"brio\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.007*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 00:55:18,564 : INFO : topic diff=0.004752, rho=0.029617\n", + "2019-01-31 00:55:18,725 : INFO : PROGRESS: pass 0, at document #2282000/4922894\n", + "2019-01-31 00:55:20,138 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:20,404 : INFO : topic #13 (0.020): 
0.027*\"new\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"london\" + 0.022*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"weekli\"\n", + "2019-01-31 00:55:20,405 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 00:55:20,406 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 00:55:20,407 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.012*\"anglo\" + 0.011*\"tajikistan\" + 0.010*\"affection\" + 0.009*\"khalsa\" + 0.009*\"alam\"\n", + "2019-01-31 00:55:20,408 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"militari\" + 0.006*\"till\" + 0.006*\"pour\"\n", + "2019-01-31 00:55:20,414 : INFO : topic diff=0.004398, rho=0.029604\n", + "2019-01-31 00:55:20,575 : INFO : PROGRESS: pass 0, at document #2284000/4922894\n", + "2019-01-31 00:55:21,957 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:22,224 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:55:22,225 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 
00:55:22,226 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"london\" + 0.022*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"weekli\"\n", + "2019-01-31 00:55:22,227 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"tajikistan\" + 0.010*\"affection\" + 0.009*\"sri\" + 0.009*\"khalsa\"\n", + "2019-01-31 00:55:22,228 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:55:22,234 : INFO : topic diff=0.004101, rho=0.029591\n", + "2019-01-31 00:55:22,392 : INFO : PROGRESS: pass 0, at document #2286000/4922894\n", + "2019-01-31 00:55:23,792 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:24,059 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.027*\"fifteenth\" + 0.017*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"arm\" + 0.009*\"depress\"\n", + "2019-01-31 00:55:24,060 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.009*\"fleet\" + 0.009*\"vernon\"\n", + "2019-01-31 00:55:24,061 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.017*\"alexand\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:55:24,062 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 0.031*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 
00:55:24,063 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"lobe\" + 0.008*\"land\"\n", + "2019-01-31 00:55:24,069 : INFO : topic diff=0.004848, rho=0.029579\n", + "2019-01-31 00:55:24,224 : INFO : PROGRESS: pass 0, at document #2288000/4922894\n", + "2019-01-31 00:55:25,591 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:25,857 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"liber\" + 0.014*\"republ\" + 0.014*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 00:55:25,859 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.019*\"year\" + 0.014*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:55:25,860 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:55:25,861 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:55:25,862 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:55:25,869 : INFO : topic diff=0.004312, rho=0.029566\n", + "2019-01-31 00:55:26,023 : INFO : PROGRESS: pass 0, at document #2290000/4922894\n", + "2019-01-31 00:55:27,407 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:27,674 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.025*\"hous\" + 0.022*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:55:27,675 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.014*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:55:27,676 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:55:27,677 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.011*\"wreath\"\n", + "2019-01-31 00:55:27,679 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:55:27,684 : INFO : topic diff=0.004632, rho=0.029553\n", + "2019-01-31 00:55:27,836 : INFO : PROGRESS: pass 0, at document #2292000/4922894\n", + "2019-01-31 00:55:29,187 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:29,453 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"jack\" + 0.011*\"word\"\n", + "2019-01-31 00:55:29,454 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 
0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:55:29,455 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:55:29,456 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.027*\"workplac\" + 0.026*\"champion\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.022*\"alic\" + 0.021*\"event\" + 0.020*\"medal\" + 0.019*\"rainfal\" + 0.019*\"atheist\"\n", + "2019-01-31 00:55:29,457 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 00:55:29,463 : INFO : topic diff=0.004792, rho=0.029540\n", + "2019-01-31 00:55:29,621 : INFO : PROGRESS: pass 0, at document #2294000/4922894\n", + "2019-01-31 00:55:30,982 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:31,252 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"pour\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 00:55:31,253 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:55:31,254 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"vigour\" + 0.044*\"popolo\" + 0.040*\"tortur\" + 0.035*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:55:31,255 : INFO : topic #45 (0.020): 0.028*\"fifteenth\" + 0.027*\"jpg\" + 0.019*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 
0.010*\"blind\" + 0.009*\"arm\" + 0.009*\"depress\"\n", + "2019-01-31 00:55:31,256 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.032*\"arsen\" + 0.026*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.013*\"rosenwald\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:55:31,262 : INFO : topic diff=0.004291, rho=0.029527\n", + "2019-01-31 00:55:31,418 : INFO : PROGRESS: pass 0, at document #2296000/4922894\n", + "2019-01-31 00:55:32,818 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:33,084 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"busi\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:55:33,086 : INFO : topic #45 (0.020): 0.027*\"fifteenth\" + 0.027*\"jpg\" + 0.019*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:55:33,087 : INFO : topic #39 (0.020): 0.055*\"canada\" + 0.043*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.018*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 00:55:33,088 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"new\" + 0.023*\"palmer\" + 0.013*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:55:33,089 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wreath\"\n", + "2019-01-31 00:55:33,095 : INFO : topic diff=0.004131, rho=0.029514\n", + "2019-01-31 00:55:33,252 : INFO : PROGRESS: pass 0, at document #2298000/4922894\n", + "2019-01-31 00:55:34,647 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:34,913 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:55:34,914 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:55:34,915 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"jack\" + 0.011*\"word\"\n", + "2019-01-31 00:55:34,916 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.025*\"australia\" + 0.025*\"sourc\" + 0.025*\"england\" + 0.024*\"london\" + 0.021*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:55:34,918 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.015*\"farid\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.012*\"financ\" + 0.011*\"denmark\"\n", + "2019-01-31 00:55:34,924 : INFO : topic diff=0.005038, rho=0.029501\n", + "2019-01-31 00:55:37,592 : INFO : -11.743 per-word bound, 3428.2 perplexity estimate based on a held-out corpus of 2000 documents with 530380 words\n", + "2019-01-31 00:55:37,593 : INFO : PROGRESS: pass 0, at document #2300000/4922894\n", + "2019-01-31 00:55:38,972 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:39,239 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"storag\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:55:39,239 : INFO 
: topic #33 (0.020): 0.063*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wreath\"\n", + "2019-01-31 00:55:39,241 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"liber\" + 0.014*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 00:55:39,241 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:55:39,242 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:55:39,248 : INFO : topic diff=0.004683, rho=0.029488\n", + "2019-01-31 00:55:39,461 : INFO : PROGRESS: pass 0, at document #2302000/4922894\n", + "2019-01-31 00:55:40,866 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:41,133 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 00:55:41,134 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.015*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.010*\"fool\" + 0.010*\"landslid\" + 0.010*\"théori\"\n", + "2019-01-31 00:55:41,135 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"storag\" + 0.011*\"collect\" + 
0.011*\"worldwid\"\n", + "2019-01-31 00:55:41,136 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:55:41,137 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:55:41,142 : INFO : topic diff=0.004773, rho=0.029476\n", + "2019-01-31 00:55:41,299 : INFO : PROGRESS: pass 0, at document #2304000/4922894\n", + "2019-01-31 00:55:42,695 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:42,961 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 00:55:42,962 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 00:55:42,963 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:55:42,964 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.043*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 00:55:42,965 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 
0.008*\"order\"\n", + "2019-01-31 00:55:42,971 : INFO : topic diff=0.005092, rho=0.029463\n", + "2019-01-31 00:55:43,131 : INFO : PROGRESS: pass 0, at document #2306000/4922894\n", + "2019-01-31 00:55:44,506 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:44,776 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:55:44,777 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.035*\"sovereignti\" + 0.031*\"rural\" + 0.028*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.018*\"poland\" + 0.018*\"moscow\" + 0.016*\"alexand\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:55:44,778 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.025*\"australia\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.024*\"london\" + 0.021*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:55:44,779 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"cancer\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 00:55:44,780 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.013*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 00:55:44,786 : INFO : topic diff=0.004721, rho=0.029450\n", + "2019-01-31 00:55:44,946 : INFO : PROGRESS: pass 0, at document #2308000/4922894\n", + "2019-01-31 00:55:46,344 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:46,610 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 
0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:55:46,611 : INFO : topic #39 (0.020): 0.055*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 00:55:46,613 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 00:55:46,614 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.022*\"member\" + 0.021*\"serv\" + 0.021*\"govern\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:55:46,615 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"diversifi\"\n", + "2019-01-31 00:55:46,620 : INFO : topic diff=0.004912, rho=0.029437\n", + "2019-01-31 00:55:46,773 : INFO : PROGRESS: pass 0, at document #2310000/4922894\n", + "2019-01-31 00:55:48,113 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:48,379 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.035*\"sovereignti\" + 0.031*\"rural\" + 0.028*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.019*\"poland\" + 0.018*\"moscow\" + 0.016*\"alexand\" + 0.014*\"czech\"\n", + "2019-01-31 00:55:48,380 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:55:48,381 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.022*\"member\" + 0.021*\"govern\" + 
0.021*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:55:48,382 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:55:48,383 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 00:55:48,389 : INFO : topic diff=0.004327, rho=0.029424\n", + "2019-01-31 00:55:48,543 : INFO : PROGRESS: pass 0, at document #2312000/4922894\n", + "2019-01-31 00:55:49,903 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:50,169 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:55:50,170 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.006*\"effect\" + 0.006*\"cancer\" + 0.006*\"proper\"\n", + "2019-01-31 00:55:50,172 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.024*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"storag\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:55:50,173 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.027*\"workplac\" + 0.027*\"men\" + 0.025*\"champion\" + 0.024*\"olymp\" + 0.022*\"event\" + 0.021*\"rainfal\" + 0.020*\"alic\" + 0.020*\"medal\" + 0.020*\"atheist\"\n", + "2019-01-31 00:55:50,174 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.022*\"member\" + 0.021*\"govern\" + 0.021*\"serv\" + 
0.016*\"gener\" + 0.016*\"start\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:55:50,179 : INFO : topic diff=0.004184, rho=0.029412\n", + "2019-01-31 00:55:50,342 : INFO : PROGRESS: pass 0, at document #2314000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:55:51,753 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:52,019 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"effect\" + 0.006*\"cancer\" + 0.006*\"proper\"\n", + "2019-01-31 00:55:52,021 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:55:52,022 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.029*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wreath\"\n", + "2019-01-31 00:55:52,023 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 00:55:52,024 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"jack\" + 0.011*\"word\"\n", + "2019-01-31 00:55:52,030 : INFO : topic diff=0.004895, rho=0.029399\n", + "2019-01-31 00:55:52,184 : INFO : PROGRESS: pass 0, at document #2316000/4922894\n", + "2019-01-31 00:55:53,543 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:53,809 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.031*\"rural\" + 
0.027*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.015*\"alexand\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:55:53,810 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.077*\"octob\" + 0.077*\"march\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.066*\"april\" + 0.065*\"decatur\" + 0.065*\"judici\" + 0.064*\"august\"\n", + "2019-01-31 00:55:53,811 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"poll\" + 0.010*\"centuri\" + 0.009*\"relationship\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:55:53,812 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.008*\"septemb\" + 0.007*\"love\" + 0.007*\"anim\" + 0.007*\"appear\" + 0.006*\"comic\" + 0.006*\"gestur\" + 0.005*\"blue\" + 0.005*\"vision\"\n", + "2019-01-31 00:55:53,813 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.039*\"tortur\" + 0.035*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:55:53,819 : INFO : topic diff=0.004881, rho=0.029386\n", + "2019-01-31 00:55:53,978 : INFO : PROGRESS: pass 0, at document #2318000/4922894\n", + "2019-01-31 00:55:55,375 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:55:55,641 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"slur\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:55:55,642 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"vacant\"\n", + "2019-01-31 00:55:55,643 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.023*\"new\" + 
0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:55:55,644 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:55:55,645 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.020*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"refut\"\n", + "2019-01-31 00:55:55,651 : INFO : topic diff=0.005084, rho=0.029374\n", + "2019-01-31 00:55:58,351 : INFO : -12.302 per-word bound, 5049.5 perplexity estimate based on a held-out corpus of 2000 documents with 552979 words\n", + "2019-01-31 00:55:58,351 : INFO : PROGRESS: pass 0, at document #2320000/4922894\n", + "2019-01-31 00:55:59,752 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:00,020 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:56:00,022 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.013*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:56:00,023 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.042*\"chilton\" + 0.022*\"hong\" + 0.021*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 00:56:00,024 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.009*\"aza\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"pour\" + 0.006*\"militari\" + 
0.006*\"govern\"\n", + "2019-01-31 00:56:00,025 : INFO : topic #26 (0.020): 0.030*\"woman\" + 0.028*\"workplac\" + 0.027*\"men\" + 0.025*\"champion\" + 0.023*\"olymp\" + 0.021*\"event\" + 0.021*\"rainfal\" + 0.020*\"atheist\" + 0.020*\"alic\" + 0.020*\"medal\"\n", + "2019-01-31 00:56:00,030 : INFO : topic diff=0.004282, rho=0.029361\n", + "2019-01-31 00:56:00,191 : INFO : PROGRESS: pass 0, at document #2322000/4922894\n", + "2019-01-31 00:56:01,567 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:01,837 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:56:01,838 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.009*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:56:01,839 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:56:01,840 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:56:01,841 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.045*\"franc\" + 0.029*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.009*\"wreath\"\n", + "2019-01-31 00:56:01,846 : INFO : topic diff=0.004100, rho=0.029348\n", + "2019-01-31 00:56:02,006 : INFO : PROGRESS: pass 0, at document #2324000/4922894\n", + "2019-01-31 00:56:03,424 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:56:03,690 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 00:56:03,691 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:56:03,692 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.018*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.014*\"paisiello\"\n", + "2019-01-31 00:56:03,693 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"network\" + 0.011*\"prognosi\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.007*\"brio\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:56:03,694 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:56:03,700 : INFO : topic diff=0.005903, rho=0.029336\n", + "2019-01-31 00:56:03,858 : INFO : PROGRESS: pass 0, at document #2326000/4922894\n", + "2019-01-31 00:56:05,249 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:56:05,515 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.018*\"sweden\" + 0.017*\"wind\" + 0.016*\"stop\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.015*\"norwegian\" + 0.014*\"farid\" + 0.013*\"financ\" + 0.013*\"turkish\"\n", + "2019-01-31 00:56:05,516 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"elabor\" + 
0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 00:56:05,517 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.022*\"member\" + 0.021*\"govern\" + 0.021*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:56:05,518 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.013*\"anglo\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.009*\"sri\" + 0.009*\"affection\"\n", + "2019-01-31 00:56:05,519 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:56:05,525 : INFO : topic diff=0.004088, rho=0.029323\n", + "2019-01-31 00:56:05,681 : INFO : PROGRESS: pass 0, at document #2328000/4922894\n", + "2019-01-31 00:56:07,076 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:07,342 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.018*\"grammat\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.014*\"paisiello\"\n", + "2019-01-31 00:56:07,344 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 00:56:07,345 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.025*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:56:07,346 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 
0.031*\"rural\" + 0.028*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 00:56:07,347 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"cultur\"\n", + "2019-01-31 00:56:07,353 : INFO : topic diff=0.004243, rho=0.029311\n", + "2019-01-31 00:56:07,518 : INFO : PROGRESS: pass 0, at document #2330000/4922894\n", + "2019-01-31 00:56:08,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:09,210 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.011*\"european\" + 0.009*\"itali\" + 0.009*\"europ\"\n", + "2019-01-31 00:56:09,211 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:56:09,212 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.013*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"carlo\"\n", + "2019-01-31 00:56:09,213 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:56:09,214 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.007*\"anim\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"blue\" + 0.005*\"workplac\"\n", + "2019-01-31 00:56:09,220 : INFO : topic diff=0.005387, rho=0.029298\n", + "2019-01-31 00:56:09,377 : INFO : PROGRESS: pass 0, 
at document #2332000/4922894\n", + "2019-01-31 00:56:10,753 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:11,019 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.011*\"case\" + 0.010*\"replac\" + 0.010*\"order\" + 0.009*\"polaris\" + 0.009*\"legal\"\n", + "2019-01-31 00:56:11,020 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.018*\"sweden\" + 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"norwai\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.014*\"farid\" + 0.013*\"turkish\" + 0.012*\"financ\"\n", + "2019-01-31 00:56:11,021 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.014*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\" + 0.012*\"physician\"\n", + "2019-01-31 00:56:11,022 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:56:11,023 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.025*\"australia\" + 0.024*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:56:11,029 : INFO : topic diff=0.004230, rho=0.029285\n", + "2019-01-31 00:56:11,237 : INFO : PROGRESS: pass 0, at document #2334000/4922894\n", + "2019-01-31 00:56:12,618 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:12,884 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"vacant\" + 0.009*\"sourc\" + 0.009*\"palmer\"\n", + "2019-01-31 00:56:12,885 : INFO : topic #48 (0.020): 0.081*\"sens\" + 0.079*\"march\" + 0.078*\"octob\" + 0.072*\"januari\" + 
0.070*\"notion\" + 0.070*\"juli\" + 0.068*\"april\" + 0.067*\"judici\" + 0.067*\"august\" + 0.066*\"decatur\"\n", + "2019-01-31 00:56:12,887 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 00:56:12,888 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 00:56:12,889 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.011*\"case\" + 0.010*\"replac\" + 0.010*\"order\" + 0.009*\"polaris\" + 0.009*\"legal\"\n", + "2019-01-31 00:56:12,895 : INFO : topic diff=0.004540, rho=0.029273\n", + "2019-01-31 00:56:13,049 : INFO : PROGRESS: pass 0, at document #2336000/4922894\n", + "2019-01-31 00:56:14,433 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:14,700 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.008*\"district\"\n", + "2019-01-31 00:56:14,701 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.037*\"raid\" + 0.031*\"arsen\" + 0.025*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.013*\"rosenwald\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:56:14,702 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:56:14,703 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"schuster\" + 0.023*\"collector\" + 0.021*\"institut\" + 
0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.011*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:56:14,704 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.007*\"anim\" + 0.007*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.007*\"gestur\" + 0.006*\"blue\" + 0.005*\"workplac\"\n", + "2019-01-31 00:56:14,710 : INFO : topic diff=0.004470, rho=0.029260\n", + "2019-01-31 00:56:14,869 : INFO : PROGRESS: pass 0, at document #2338000/4922894\n", + "2019-01-31 00:56:16,253 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:16,520 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"taxpay\" + 0.025*\"scientist\" + 0.022*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:56:16,521 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.007*\"english\" + 0.007*\"trade\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:56:16,522 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:56:16,523 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.044*\"american\" + 0.025*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.015*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:56:16,525 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 00:56:16,530 : INFO : topic diff=0.004893, 
rho=0.029248\n", + "2019-01-31 00:56:19,310 : INFO : -11.571 per-word bound, 3041.6 perplexity estimate based on a held-out corpus of 2000 documents with 538395 words\n", + "2019-01-31 00:56:19,311 : INFO : PROGRESS: pass 0, at document #2340000/4922894\n", + "2019-01-31 00:56:20,683 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:20,949 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 00:56:20,950 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.014*\"open\"\n", + "2019-01-31 00:56:20,951 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.012*\"anglo\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.011*\"khalsa\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.010*\"sri\" + 0.010*\"muskoge\"\n", + "2019-01-31 00:56:20,952 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.008*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:56:20,953 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.014*\"israel\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"itali\"\n", + "2019-01-31 00:56:20,960 : INFO : topic diff=0.003730, rho=0.029235\n", + "2019-01-31 00:56:21,119 : INFO : PROGRESS: pass 0, at document #2342000/4922894\n", + "2019-01-31 00:56:22,515 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:22,782 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"yawn\" + 
0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 00:56:22,783 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:56:22,784 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.040*\"tortur\" + 0.034*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.020*\"cede\"\n", + "2019-01-31 00:56:22,785 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.022*\"hong\" + 0.022*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 00:56:22,786 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.031*\"priest\" + 0.019*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 00:56:22,792 : INFO : topic diff=0.006449, rho=0.029223\n", + "2019-01-31 00:56:22,946 : INFO : PROGRESS: pass 0, at document #2344000/4922894\n", + "2019-01-31 00:56:24,301 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:24,568 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 00:56:24,569 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.013*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 00:56:24,569 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.027*\"jacksonvil\" + 0.022*\"noll\" + 
0.021*\"japanes\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:56:24,570 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"order\" + 0.009*\"polaris\" + 0.009*\"legal\"\n", + "2019-01-31 00:56:24,571 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.018*\"sweden\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.016*\"wind\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.014*\"farid\" + 0.012*\"financ\" + 0.012*\"turkish\"\n", + "2019-01-31 00:56:24,577 : INFO : topic diff=0.004345, rho=0.029210\n", + "2019-01-31 00:56:24,732 : INFO : PROGRESS: pass 0, at document #2346000/4922894\n", + "2019-01-31 00:56:26,097 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:26,363 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.014*\"brazil\"\n", + "2019-01-31 00:56:26,364 : INFO : topic #13 (0.020): 0.025*\"new\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.025*\"australia\" + 0.023*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:56:26,365 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.007*\"anim\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:56:26,366 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.021*\"member\" + 0.021*\"govern\" + 0.021*\"serv\" + 0.016*\"gener\" + 0.015*\"start\" + 0.015*\"chickasaw\"\n", + "2019-01-31 00:56:26,367 : INFO : topic #48 (0.020): 0.081*\"sens\" + 0.079*\"march\" + 0.078*\"octob\" + 0.073*\"januari\" + 0.071*\"notion\" + 
0.071*\"juli\" + 0.069*\"april\" + 0.068*\"august\" + 0.068*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 00:56:26,373 : INFO : topic diff=0.004569, rho=0.029198\n", + "2019-01-31 00:56:26,530 : INFO : PROGRESS: pass 0, at document #2348000/4922894\n", + "2019-01-31 00:56:27,915 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:28,181 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.022*\"hong\" + 0.021*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.015*\"sourc\" + 0.015*\"leah\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 00:56:28,182 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.014*\"open\"\n", + "2019-01-31 00:56:28,183 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.025*\"australia\" + 0.023*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:56:28,184 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.029*\"pari\" + 0.021*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:56:28,185 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.017*\"adulthood\" + 0.014*\"feel\" + 0.012*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.008*\"hostil\" + 0.008*\"biom\" + 0.008*\"western\"\n", + "2019-01-31 00:56:28,191 : INFO : topic diff=0.004108, rho=0.029185\n", + "2019-01-31 00:56:28,350 : INFO : PROGRESS: pass 0, at document #2350000/4922894\n", + "2019-01-31 00:56:29,735 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:30,001 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.007*\"anim\" + 0.007*\"love\" + 
0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:56:30,002 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"develop\" + 0.006*\"spectacl\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:56:30,004 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 00:56:30,005 : INFO : topic #40 (0.020): 0.090*\"unit\" + 0.023*\"collector\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:56:30,005 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.029*\"pari\" + 0.021*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:56:30,011 : INFO : topic diff=0.004374, rho=0.029173\n", + "2019-01-31 00:56:30,168 : INFO : PROGRESS: pass 0, at document #2352000/4922894\n", + "2019-01-31 00:56:31,556 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:31,824 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"televis\" + 0.010*\"sri\" + 0.010*\"alam\"\n", + "2019-01-31 00:56:31,825 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.028*\"workplac\" + 0.027*\"men\" + 0.026*\"champion\" + 0.024*\"olymp\" + 0.021*\"event\" + 0.021*\"medal\" + 0.020*\"rainfal\" + 0.020*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:56:31,827 : INFO : topic #28 (0.020): 0.030*\"build\" + 
0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"strategist\" + 0.011*\"briarwood\" + 0.010*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:56:31,828 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"japanes\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:56:31,829 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.014*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:56:31,835 : INFO : topic diff=0.004075, rho=0.029161\n", + "2019-01-31 00:56:31,988 : INFO : PROGRESS: pass 0, at document #2354000/4922894\n", + "2019-01-31 00:56:33,340 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:33,607 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:56:33,608 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 00:56:33,609 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"armi\" + 0.021*\"aggress\" + 0.019*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.012*\"unionist\" + 0.012*\"militari\" + 0.012*\"refut\" + 0.012*\"airbu\"\n", + "2019-01-31 00:56:33,610 : INFO : topic #2 (0.020): 0.058*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.009*\"fleet\" + 0.008*\"vernon\"\n", + "2019-01-31 00:56:33,611 : INFO : topic #25 (0.020): 0.032*\"ring\" + 
0.018*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"vacant\" + 0.009*\"palmer\"\n", + "2019-01-31 00:56:33,617 : INFO : topic diff=0.005187, rho=0.029148\n", + "2019-01-31 00:56:33,771 : INFO : PROGRESS: pass 0, at document #2356000/4922894\n", + "2019-01-31 00:56:35,138 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:35,404 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.025*\"taxpay\" + 0.025*\"scientist\" + 0.022*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:56:35,405 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"order\" + 0.009*\"legal\"\n", + "2019-01-31 00:56:35,406 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:56:35,407 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.024*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:56:35,408 : INFO : topic #11 (0.020): 0.025*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"georg\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\"\n", + "2019-01-31 00:56:35,414 : INFO : topic diff=0.004280, rho=0.029136\n", + "2019-01-31 00:56:35,567 : INFO : PROGRESS: pass 0, at document #2358000/4922894\n", + "2019-01-31 00:56:36,945 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:37,212 : INFO : topic #42 (0.020): 0.048*\"german\" + 
0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.011*\"european\" + 0.009*\"hungarian\" + 0.009*\"itali\"\n", + "2019-01-31 00:56:37,213 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.007*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:56:37,214 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.027*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"task\" + 0.008*\"district\"\n", + "2019-01-31 00:56:37,215 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.037*\"raid\" + 0.030*\"arsen\" + 0.024*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.014*\"rosenwald\" + 0.013*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:56:37,216 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"order\" + 0.009*\"legal\"\n", + "2019-01-31 00:56:37,222 : INFO : topic diff=0.004180, rho=0.029123\n", + "2019-01-31 00:56:39,918 : INFO : -11.707 per-word bound, 3342.2 perplexity estimate based on a held-out corpus of 2000 documents with 549535 words\n", + "2019-01-31 00:56:39,918 : INFO : PROGRESS: pass 0, at document #2360000/4922894\n", + "2019-01-31 00:56:41,303 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:41,569 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.028*\"workplac\" + 0.027*\"men\" + 0.026*\"champion\" + 0.024*\"olymp\" + 0.021*\"event\" + 0.021*\"medal\" + 0.020*\"rainfal\" + 0.019*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:56:41,571 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"pathwai\" + 
0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"cancer\"\n", + "2019-01-31 00:56:41,571 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.040*\"tortur\" + 0.034*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.020*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:56:41,573 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.007*\"anim\" + 0.007*\"love\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:56:41,574 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 00:56:41,579 : INFO : topic diff=0.005537, rho=0.029111\n", + "2019-01-31 00:56:41,737 : INFO : PROGRESS: pass 0, at document #2362000/4922894\n", + "2019-01-31 00:56:43,116 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:43,382 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"cultur\"\n", + "2019-01-31 00:56:43,383 : INFO : topic #2 (0.020): 0.059*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.011*\"blur\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:56:43,384 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:56:43,385 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.025*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.023*\"england\" + 
0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 00:56:43,386 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:56:43,392 : INFO : topic diff=0.004907, rho=0.029099\n", + "2019-01-31 00:56:43,549 : INFO : PROGRESS: pass 0, at document #2364000/4922894\n", + "2019-01-31 00:56:44,961 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:45,228 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:56:45,229 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.032*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"duke\" + 0.017*\"quarterli\" + 0.016*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 00:56:45,230 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:56:45,231 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"cultur\"\n", + "2019-01-31 00:56:45,232 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 00:56:45,238 : INFO : topic diff=0.003853, rho=0.029086\n", + "2019-01-31 00:56:45,397 : INFO : PROGRESS: pass 0, at document 
#2366000/4922894\n", + "2019-01-31 00:56:46,812 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:47,081 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:56:47,082 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.017*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.015*\"chamber\" + 0.014*\"open\"\n", + "2019-01-31 00:56:47,083 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 00:56:47,084 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.043*\"american\" + 0.025*\"valour\" + 0.019*\"dutch\" + 0.017*\"folei\" + 0.017*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.014*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:56:47,085 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.024*\"schuster\" + 0.023*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:56:47,091 : INFO : topic diff=0.004191, rho=0.029074\n", + "2019-01-31 00:56:47,312 : INFO : PROGRESS: pass 0, at document #2368000/4922894\n", + "2019-01-31 00:56:48,738 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:49,004 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"pop\" + 0.010*\"network\" + 0.009*\"develop\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 00:56:49,005 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 
0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:56:49,006 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"cancer\"\n", + "2019-01-31 00:56:49,007 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.019*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"task\" + 0.009*\"district\"\n", + "2019-01-31 00:56:49,008 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:56:49,014 : INFO : topic diff=0.004161, rho=0.029062\n", + "2019-01-31 00:56:49,171 : INFO : PROGRESS: pass 0, at document #2370000/4922894\n", + "2019-01-31 00:56:50,563 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:50,830 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 00:56:50,831 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.010*\"televis\" + 0.010*\"muskoge\" + 0.010*\"tajikistan\"\n", + "2019-01-31 00:56:50,832 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"vacant\"\n", + "2019-01-31 00:56:50,833 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 
0.017*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\" + 0.012*\"physician\"\n", + "2019-01-31 00:56:50,834 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.044*\"american\" + 0.025*\"valour\" + 0.019*\"dutch\" + 0.017*\"folei\" + 0.017*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:56:50,839 : INFO : topic diff=0.004432, rho=0.029050\n", + "2019-01-31 00:56:51,000 : INFO : PROGRESS: pass 0, at document #2372000/4922894\n", + "2019-01-31 00:56:52,416 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:52,683 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:56:52,684 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.065*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"japanes\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 00:56:52,685 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.044*\"line\" + 0.038*\"raid\" + 0.030*\"arsen\" + 0.024*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.014*\"rosenwald\" + 0.012*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:56:52,686 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:56:52,687 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 00:56:52,693 : INFO : topic diff=0.004759, rho=0.029037\n", + "2019-01-31 00:56:52,847 : INFO : PROGRESS: pass 0, at document 
#2374000/4922894\n", + "2019-01-31 00:56:54,205 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:54,472 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:56:54,473 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.014*\"open\"\n", + "2019-01-31 00:56:54,474 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"swedish\" + 0.017*\"norwai\" + 0.016*\"sweden\" + 0.016*\"wind\" + 0.014*\"norwegian\" + 0.014*\"damag\" + 0.012*\"treeless\" + 0.012*\"huntsvil\" + 0.011*\"farid\"\n", + "2019-01-31 00:56:54,475 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:56:54,476 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.013*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 00:56:54,482 : INFO : topic diff=0.003722, rho=0.029025\n", + "2019-01-31 00:56:54,646 : INFO : PROGRESS: pass 0, at document #2376000/4922894\n", + "2019-01-31 00:56:56,036 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:56,303 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.013*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 00:56:56,304 : INFO : topic #18 
(0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"kenworthi\" + 0.004*\"call\"\n", + "2019-01-31 00:56:56,305 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.032*\"priest\" + 0.020*\"rotterdam\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.017*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.014*\"portugues\" + 0.014*\"count\" + 0.014*\"kingdom\"\n", + "2019-01-31 00:56:56,306 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:56:56,307 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"cultur\" + 0.007*\"human\"\n", + "2019-01-31 00:56:56,313 : INFO : topic diff=0.004264, rho=0.029013\n", + "2019-01-31 00:56:56,473 : INFO : PROGRESS: pass 0, at document #2378000/4922894\n", + "2019-01-31 00:56:57,862 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:56:58,128 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:56:58,129 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.078*\"sens\" + 0.078*\"octob\" + 0.072*\"januari\" + 0.071*\"notion\" + 0.070*\"juli\" + 0.069*\"decatur\" + 0.068*\"april\" + 0.067*\"judici\" + 0.067*\"august\"\n", + "2019-01-31 00:56:58,130 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.034*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:56:58,131 : INFO : topic #33 (0.020): 
0.061*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.021*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:56:58,132 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.022*\"kong\" + 0.022*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 00:56:58,138 : INFO : topic diff=0.004136, rho=0.029001\n", + "2019-01-31 00:57:00,859 : INFO : -11.557 per-word bound, 3013.3 perplexity estimate based on a held-out corpus of 2000 documents with 564334 words\n", + "2019-01-31 00:57:00,859 : INFO : PROGRESS: pass 0, at document #2380000/4922894\n", + "2019-01-31 00:57:02,257 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:02,523 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:57:02,524 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.006*\"woman\"\n", + "2019-01-31 00:57:02,525 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.011*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:57:02,526 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 00:57:02,528 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.009*\"industri\" + 
0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 00:57:02,533 : INFO : topic diff=0.004742, rho=0.028989\n", + "2019-01-31 00:57:02,691 : INFO : PROGRESS: pass 0, at document #2382000/4922894\n", + "2019-01-31 00:57:04,079 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:04,346 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.013*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 00:57:04,347 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"sri\"\n", + "2019-01-31 00:57:04,348 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 00:57:04,349 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"armi\" + 0.021*\"aggress\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 00:57:04,350 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:57:04,356 : INFO : topic diff=0.004098, rho=0.028976\n", + "2019-01-31 00:57:04,509 : INFO : PROGRESS: pass 0, at document #2384000/4922894\n", + "2019-01-31 00:57:05,871 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:06,137 : INFO : topic #2 (0.020): 0.055*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 
0.011*\"nativist\" + 0.010*\"fleet\" + 0.008*\"sai\"\n", + "2019-01-31 00:57:06,139 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:57:06,140 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"cultur\" + 0.007*\"human\" + 0.007*\"woman\"\n", + "2019-01-31 00:57:06,141 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"open\"\n", + "2019-01-31 00:57:06,142 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:57:06,147 : INFO : topic diff=0.003983, rho=0.028964\n", + "2019-01-31 00:57:06,305 : INFO : PROGRESS: pass 0, at document #2386000/4922894\n", + "2019-01-31 00:57:07,700 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:07,967 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:57:07,968 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:57:07,969 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.014*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 
0.011*\"francisco\" + 0.011*\"josé\"\n", + "2019-01-31 00:57:07,970 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.022*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:57:07,971 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.033*\"yawn\" + 0.027*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.020*\"japanes\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"prison\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:57:07,977 : INFO : topic diff=0.004362, rho=0.028952\n", + "2019-01-31 00:57:08,132 : INFO : PROGRESS: pass 0, at document #2388000/4922894\n", + "2019-01-31 00:57:09,506 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:09,772 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.016*\"vol\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.011*\"european\" + 0.010*\"jeremiah\" + 0.009*\"europ\"\n", + "2019-01-31 00:57:09,773 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:57:09,774 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.028*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:57:09,775 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 00:57:09,776 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 
0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 00:57:09,782 : INFO : topic diff=0.004244, rho=0.028940\n", + "2019-01-31 00:57:09,937 : INFO : PROGRESS: pass 0, at document #2390000/4922894\n", + "2019-01-31 00:57:11,313 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:11,579 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 00:57:11,580 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.020*\"dutch\" + 0.018*\"english\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"polit\" + 0.013*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:57:11,582 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:57:11,583 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:57:11,584 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"method\"\n", + "2019-01-31 00:57:11,590 : INFO : topic diff=0.004085, rho=0.028928\n", + "2019-01-31 00:57:11,743 : INFO : PROGRESS: pass 0, at document #2392000/4922894\n", + "2019-01-31 00:57:13,117 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:13,383 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" 
+ 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:57:13,384 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"damn\" + 0.016*\"compos\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:57:13,385 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:57:13,386 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:57:13,387 : INFO : topic #2 (0.020): 0.055*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.009*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:57:13,393 : INFO : topic diff=0.004585, rho=0.028916\n", + "2019-01-31 00:57:13,549 : INFO : PROGRESS: pass 0, at document #2394000/4922894\n", + "2019-01-31 00:57:14,928 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:15,194 : INFO : topic #2 (0.020): 0.055*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.011*\"blur\" + 0.010*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:57:15,195 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"swedish\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.016*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.012*\"treeless\" + 0.012*\"turkish\" + 0.011*\"farid\"\n", + "2019-01-31 00:57:15,196 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 
0.020*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:57:15,197 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.021*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:57:15,198 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.016*\"vol\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.011*\"european\" + 0.010*\"jeremiah\" + 0.009*\"itali\"\n", + "2019-01-31 00:57:15,204 : INFO : topic diff=0.004292, rho=0.028904\n", + "2019-01-31 00:57:15,360 : INFO : PROGRESS: pass 0, at document #2396000/4922894\n", + "2019-01-31 00:57:16,745 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:17,011 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"cathol\" + 0.021*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"centuri\" + 0.009*\"parish\" + 0.008*\"poll\"\n", + "2019-01-31 00:57:17,012 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.030*\"arsen\" + 0.025*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.014*\"rosenwald\" + 0.012*\"exhaust\" + 0.012*\"oper\"\n", + "2019-01-31 00:57:17,013 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.015*\"adulthood\" + 0.013*\"feel\" + 0.012*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"western\" + 0.009*\"biom\" + 0.008*\"median\"\n", + "2019-01-31 00:57:17,014 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.021*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:57:17,015 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 
0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.015*\"portugues\" + 0.014*\"kingdom\" + 0.014*\"count\"\n", + "2019-01-31 00:57:17,021 : INFO : topic diff=0.004440, rho=0.028892\n", + "2019-01-31 00:57:17,234 : INFO : PROGRESS: pass 0, at document #2398000/4922894\n", + "2019-01-31 00:57:18,618 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:18,885 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"jeremiah\" + 0.009*\"itali\"\n", + "2019-01-31 00:57:18,886 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:57:18,887 : INFO : topic #2 (0.020): 0.055*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 00:57:18,888 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.016*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 00:57:18,889 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.028*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:57:18,895 : INFO : topic diff=0.004711, rho=0.028880\n", + "2019-01-31 00:57:21,545 : INFO : -11.655 per-word bound, 3224.3 perplexity estimate based on a held-out corpus of 2000 documents with 540892 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:57:21,546 : INFO : PROGRESS: pass 0, at 
document #2400000/4922894\n", + "2019-01-31 00:57:22,912 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:23,178 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.023*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:57:23,179 : INFO : topic #26 (0.020): 0.029*\"woman\" + 0.028*\"workplac\" + 0.027*\"men\" + 0.026*\"champion\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:57:23,180 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.021*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:57:23,181 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:57:23,182 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"prognosi\" + 0.010*\"network\" + 0.009*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.007*\"diggin\" + 0.007*\"brio\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:57:23,188 : INFO : topic diff=0.003905, rho=0.028868\n", + "2019-01-31 00:57:23,350 : INFO : PROGRESS: pass 0, at document #2402000/4922894\n", + "2019-01-31 00:57:24,775 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:25,042 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 00:57:25,043 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" 
+ 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"pour\" + 0.006*\"govern\" + 0.006*\"till\"\n", + "2019-01-31 00:57:25,044 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.013*\"treeless\" + 0.012*\"turkish\" + 0.011*\"farid\"\n", + "2019-01-31 00:57:25,045 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"centuri\" + 0.009*\"parish\" + 0.009*\"poll\"\n", + "2019-01-31 00:57:25,046 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:57:25,051 : INFO : topic diff=0.005205, rho=0.028855\n", + "2019-01-31 00:57:25,209 : INFO : PROGRESS: pass 0, at document #2404000/4922894\n", + "2019-01-31 00:57:26,590 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:26,856 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.015*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.008*\"arm\"\n", + "2019-01-31 00:57:26,857 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:57:26,859 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:57:26,860 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 
0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:57:26,861 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 00:57:26,866 : INFO : topic diff=0.003970, rho=0.028843\n", + "2019-01-31 00:57:27,024 : INFO : PROGRESS: pass 0, at document #2406000/4922894\n", + "2019-01-31 00:57:28,418 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:28,685 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:57:28,686 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.008*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:57:28,687 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.017*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.008*\"light\"\n", + "2019-01-31 00:57:28,688 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.015*\"adulthood\" + 0.013*\"feel\" + 0.012*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:57:28,689 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.014*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:57:28,695 : INFO : topic diff=0.004941, rho=0.028831\n", + "2019-01-31 00:57:28,850 : INFO : PROGRESS: pass 0, at 
document #2408000/4922894\n", + "2019-01-31 00:57:30,216 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:30,483 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"poet\" + 0.006*\"théori\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"method\"\n", + "2019-01-31 00:57:30,484 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"armi\" + 0.021*\"aggress\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:57:30,485 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.070*\"notion\" + 0.070*\"juli\" + 0.069*\"april\" + 0.069*\"judici\" + 0.068*\"decatur\" + 0.067*\"august\"\n", + "2019-01-31 00:57:30,486 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 00:57:30,487 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"portugues\" + 0.014*\"kingdom\" + 0.014*\"count\"\n", + "2019-01-31 00:57:30,493 : INFO : topic diff=0.004450, rho=0.028820\n", + "2019-01-31 00:57:30,644 : INFO : PROGRESS: pass 0, at document #2410000/4922894\n", + "2019-01-31 00:57:31,969 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:32,235 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.015*\"adulthood\" + 0.013*\"feel\" + 0.011*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:57:32,236 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 
0.018*\"del\" + 0.017*\"mexico\" + 0.014*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"lizard\" + 0.010*\"francisco\"\n", + "2019-01-31 00:57:32,237 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:57:32,239 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"john\" + 0.012*\"will\"\n", + "2019-01-31 00:57:32,240 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.014*\"count\"\n", + "2019-01-31 00:57:32,245 : INFO : topic diff=0.004224, rho=0.028808\n", + "2019-01-31 00:57:32,398 : INFO : PROGRESS: pass 0, at document #2412000/4922894\n", + "2019-01-31 00:57:33,754 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:57:34,021 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.036*\"raid\" + 0.029*\"arsen\" + 0.024*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.014*\"rosenwald\" + 0.012*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 00:57:34,022 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"western\" + 0.016*\"black\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.008*\"light\"\n", + "2019-01-31 00:57:34,023 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 
00:57:34,024 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.011*\"alam\" + 0.010*\"muskoge\" + 0.010*\"sri\"\n", + "2019-01-31 00:57:34,025 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"seri\"\n", + "2019-01-31 00:57:34,031 : INFO : topic diff=0.005137, rho=0.028796\n", + "2019-01-31 00:57:34,189 : INFO : PROGRESS: pass 0, at document #2414000/4922894\n", + "2019-01-31 00:57:35,585 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:35,852 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.022*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:57:35,853 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 00:57:35,854 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:57:35,855 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.019*\"dutch\" + 0.017*\"english\" + 0.016*\"folei\" + 0.016*\"player\" + 0.016*\"polit\" + 0.013*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 00:57:35,856 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"open\"\n", + "2019-01-31 00:57:35,862 : INFO : topic 
diff=0.004604, rho=0.028784\n", + "2019-01-31 00:57:36,021 : INFO : PROGRESS: pass 0, at document #2416000/4922894\n", + "2019-01-31 00:57:37,422 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:37,689 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.025*\"toronto\" + 0.021*\"hoar\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 00:57:37,690 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 00:57:37,691 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:57:37,692 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.008*\"palmer\" + 0.008*\"vacant\"\n", + "2019-01-31 00:57:37,693 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.012*\"airmen\" + 0.012*\"airbu\"\n", + "2019-01-31 00:57:37,699 : INFO : topic diff=0.004405, rho=0.028772\n", + "2019-01-31 00:57:37,858 : INFO : PROGRESS: pass 0, at document #2418000/4922894\n", + "2019-01-31 00:57:39,243 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:39,509 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 
00:57:39,510 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:57:39,510 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.014*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:57:39,511 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.022*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"seri\"\n", + "2019-01-31 00:57:39,513 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:57:39,518 : INFO : topic diff=0.004684, rho=0.028760\n", + "2019-01-31 00:57:42,229 : INFO : -11.658 per-word bound, 3232.6 perplexity estimate based on a held-out corpus of 2000 documents with 561226 words\n", + "2019-01-31 00:57:42,229 : INFO : PROGRESS: pass 0, at document #2420000/4922894\n", + "2019-01-31 00:57:43,624 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:43,890 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 00:57:43,892 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"john\" + 0.012*\"will\"\n", + "2019-01-31 00:57:43,892 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 
0.021*\"walter\" + 0.017*\"com\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.012*\"airmen\" + 0.012*\"airbu\"\n", + "2019-01-31 00:57:43,894 : INFO : topic #27 (0.020): 0.066*\"questionnair\" + 0.021*\"candid\" + 0.020*\"ret\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"champion\" + 0.011*\"squatter\"\n", + "2019-01-31 00:57:43,894 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.038*\"sovereignti\" + 0.033*\"rural\" + 0.030*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.020*\"poland\" + 0.020*\"moscow\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:57:43,900 : INFO : topic diff=0.004827, rho=0.028748\n", + "2019-01-31 00:57:44,061 : INFO : PROGRESS: pass 0, at document #2422000/4922894\n", + "2019-01-31 00:57:45,477 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:45,744 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:57:45,745 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:57:45,746 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.012*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 00:57:45,747 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 00:57:45,748 : INFO : topic #37 (0.020): 0.010*\"charact\" + 0.009*\"man\" + 
0.009*\"septemb\" + 0.008*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"blue\" + 0.005*\"workplac\"\n", + "2019-01-31 00:57:45,754 : INFO : topic diff=0.005325, rho=0.028736\n", + "2019-01-31 00:57:45,911 : INFO : PROGRESS: pass 0, at document #2424000/4922894\n", + "2019-01-31 00:57:47,289 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:57:47,555 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:57:47,556 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"palmer\" + 0.008*\"vacant\"\n", + "2019-01-31 00:57:47,557 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"open\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:57:47,558 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 00:57:47,559 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.039*\"tortur\" + 0.034*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.022*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:57:47,565 : INFO : topic diff=0.004299, rho=0.028724\n", + "2019-01-31 00:57:47,720 : INFO : PROGRESS: pass 0, at document #2426000/4922894\n", + "2019-01-31 00:57:49,067 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
00:57:49,334 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.073*\"januari\" + 0.072*\"juli\" + 0.072*\"notion\" + 0.071*\"april\" + 0.070*\"judici\" + 0.069*\"august\" + 0.069*\"decatur\"\n", + "2019-01-31 00:57:49,335 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 00:57:49,336 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.047*\"american\" + 0.025*\"valour\" + 0.018*\"dutch\" + 0.018*\"english\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"polit\" + 0.013*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:57:49,337 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.008*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:57:49,338 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"open\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:57:49,344 : INFO : topic diff=0.004469, rho=0.028712\n", + "2019-01-31 00:57:49,500 : INFO : PROGRESS: pass 0, at document #2428000/4922894\n", + "2019-01-31 00:57:50,898 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:51,164 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"pop\" + 0.011*\"network\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.007*\"brio\" + 0.007*\"diggin\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:57:51,166 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"act\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 00:57:51,166 : INFO : 
topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.014*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:57:51,168 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.007*\"media\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 00:57:51,169 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:57:51,175 : INFO : topic diff=0.004472, rho=0.028701\n", + "2019-01-31 00:57:51,337 : INFO : PROGRESS: pass 0, at document #2430000/4922894\n", + "2019-01-31 00:57:52,754 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:53,021 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 00:57:53,022 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.007*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 00:57:53,023 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:57:53,024 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 00:57:53,025 
: INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"swedish\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.012*\"turkish\" + 0.012*\"denmark\" + 0.012*\"farid\"\n", + "2019-01-31 00:57:53,031 : INFO : topic diff=0.004694, rho=0.028689\n", + "2019-01-31 00:57:53,241 : INFO : PROGRESS: pass 0, at document #2432000/4922894\n", + "2019-01-31 00:57:54,603 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:54,870 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"centuri\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:57:54,871 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.047*\"american\" + 0.025*\"valour\" + 0.018*\"dutch\" + 0.018*\"english\" + 0.017*\"folei\" + 0.016*\"player\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:57:54,872 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"alam\" + 0.011*\"muskoge\" + 0.010*\"televis\" + 0.010*\"affection\"\n", + "2019-01-31 00:57:54,874 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.009*\"man\" + 0.009*\"septemb\" + 0.008*\"comic\" + 0.008*\"anim\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.005*\"vision\" + 0.005*\"blue\"\n", + "2019-01-31 00:57:54,875 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:57:54,881 : INFO : topic diff=0.004256, rho=0.028677\n", + "2019-01-31 00:57:55,034 : INFO : PROGRESS: pass 0, at document #2434000/4922894\n", + "2019-01-31 00:57:56,509 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 00:57:56,777 : INFO : topic #36 (0.020): 0.011*\"pop\" + 0.011*\"prognosi\" + 0.011*\"network\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.007*\"brio\" + 0.007*\"diggin\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:57:56,778 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.028*\"workplac\" + 0.027*\"champion\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 00:57:56,779 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"centuri\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:57:56,781 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:57:56,782 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"swedish\" + 0.017*\"sweden\" + 0.017*\"norwai\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"turkish\" + 0.012*\"farid\" + 0.011*\"turkei\"\n", + "2019-01-31 00:57:56,788 : INFO : topic diff=0.004577, rho=0.028665\n", + "2019-01-31 00:57:56,943 : INFO : PROGRESS: pass 0, at document #2436000/4922894\n", + "2019-01-31 00:57:58,331 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:57:58,597 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.027*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.010*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:57:58,598 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" 
+ 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:57:58,599 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.074*\"juli\" + 0.073*\"januari\" + 0.072*\"notion\" + 0.071*\"april\" + 0.071*\"judici\" + 0.070*\"august\" + 0.069*\"decatur\"\n", + "2019-01-31 00:57:58,601 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 00:57:58,602 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"western\" + 0.016*\"black\" + 0.016*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.008*\"pain\"\n", + "2019-01-31 00:57:58,607 : INFO : topic diff=0.003927, rho=0.028653\n", + "2019-01-31 00:57:58,768 : INFO : PROGRESS: pass 0, at document #2438000/4922894\n", + "2019-01-31 00:58:00,177 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:00,443 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.047*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.012*\"kim\"\n", + "2019-01-31 00:58:00,444 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"palmer\" + 0.008*\"vacant\"\n", + "2019-01-31 00:58:00,445 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:58:00,446 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.016*\"vol\" + 0.015*\"israel\" 
+ 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"jeremiah\" + 0.009*\"europ\"\n", + "2019-01-31 00:58:00,447 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"group\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"workplac\"\n", + "2019-01-31 00:58:00,453 : INFO : topic diff=0.004900, rho=0.028642\n", + "2019-01-31 00:58:03,129 : INFO : -11.515 per-word bound, 2927.3 perplexity estimate based on a held-out corpus of 2000 documents with 547284 words\n", + "2019-01-31 00:58:03,130 : INFO : PROGRESS: pass 0, at document #2440000/4922894\n", + "2019-01-31 00:58:04,509 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:04,776 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"western\" + 0.016*\"black\" + 0.016*\"colder\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.008*\"pain\"\n", + "2019-01-31 00:58:04,777 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.012*\"life\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 00:58:04,778 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.015*\"physician\" + 0.015*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:58:04,779 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.017*\"champion\" + 0.015*\"open\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:58:04,780 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.025*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"nicola\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 
00:58:04,786 : INFO : topic diff=0.004212, rho=0.028630\n", + "2019-01-31 00:58:04,944 : INFO : PROGRESS: pass 0, at document #2442000/4922894\n", + "2019-01-31 00:58:06,326 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:06,592 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.024*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:58:06,593 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:58:06,594 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:58:06,595 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.029*\"poison\" + 0.027*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.020*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:58:06,597 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:58:06,602 : INFO : topic diff=0.004376, rho=0.028618\n", + "2019-01-31 00:58:06,760 : INFO : PROGRESS: pass 0, at document #2444000/4922894\n", + "2019-01-31 00:58:08,102 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:08,371 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"april\" + 0.071*\"notion\" + 0.070*\"august\" + 0.069*\"judici\" + 0.068*\"decatur\"\n", + 
"2019-01-31 00:58:08,372 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.031*\"priest\" + 0.021*\"rotterdam\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 00:58:08,373 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:58:08,374 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 00:58:08,375 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.018*\"dutch\" + 0.018*\"english\" + 0.017*\"folei\" + 0.017*\"player\" + 0.016*\"polit\" + 0.013*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:58:08,381 : INFO : topic diff=0.004427, rho=0.028606\n", + "2019-01-31 00:58:08,539 : INFO : PROGRESS: pass 0, at document #2446000/4922894\n", + "2019-01-31 00:58:09,932 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:10,199 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 00:58:10,200 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.038*\"sovereignti\" + 0.036*\"rural\" + 0.028*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.020*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:58:10,201 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.039*\"tortur\" + 0.033*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 
0.019*\"cede\"\n", + "2019-01-31 00:58:10,202 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"norwai\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.012*\"farid\" + 0.012*\"denmark\" + 0.012*\"turkish\"\n", + "2019-01-31 00:58:10,203 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:58:10,209 : INFO : topic diff=0.004222, rho=0.028595\n", + "2019-01-31 00:58:10,368 : INFO : PROGRESS: pass 0, at document #2448000/4922894\n", + "2019-01-31 00:58:11,774 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:12,040 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.039*\"tortur\" + 0.033*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:58:12,041 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.038*\"sovereignti\" + 0.036*\"rural\" + 0.028*\"poison\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 00:58:12,042 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.015*\"adulthood\" + 0.013*\"feel\" + 0.011*\"plaisir\" + 0.011*\"male\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"median\"\n", + "2019-01-31 00:58:12,043 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.012*\"life\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 00:58:12,044 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.011*\"pop\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" 
+ 0.008*\"cytokin\" + 0.007*\"brio\" + 0.007*\"diggin\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:58:12,050 : INFO : topic diff=0.003707, rho=0.028583\n", + "2019-01-31 00:58:12,207 : INFO : PROGRESS: pass 0, at document #2450000/4922894\n", + "2019-01-31 00:58:13,590 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:13,856 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"kenworthi\"\n", + "2019-01-31 00:58:13,857 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"centuri\" + 0.009*\"parish\"\n", + "2019-01-31 00:58:13,858 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:58:13,859 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.039*\"tortur\" + 0.034*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.019*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:58:13,860 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"jeremiah\" + 0.010*\"europ\"\n", + "2019-01-31 00:58:13,866 : INFO : topic diff=0.004929, rho=0.028571\n", + "2019-01-31 00:58:14,022 : INFO : PROGRESS: pass 0, at document #2452000/4922894\n", + "2019-01-31 00:58:15,406 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:15,672 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 
0.024*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:58:15,673 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"airmen\"\n", + "2019-01-31 00:58:15,674 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.029*\"pari\" + 0.021*\"jean\" + 0.020*\"sail\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 00:58:15,675 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.032*\"priest\" + 0.021*\"rotterdam\" + 0.019*\"duke\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"idiosyncrat\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 00:58:15,677 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:58:15,682 : INFO : topic diff=0.004492, rho=0.028560\n", + "2019-01-31 00:58:15,843 : INFO : PROGRESS: pass 0, at document #2454000/4922894\n", + "2019-01-31 00:58:17,210 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:17,479 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.027*\"workplac\" + 0.027*\"champion\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.020*\"rainfal\" + 0.020*\"event\" + 0.018*\"alic\" + 0.018*\"atheist\"\n", + "2019-01-31 00:58:17,480 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:58:17,481 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 
0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 00:58:17,482 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.018*\"sweden\" + 0.017*\"swedish\" + 0.016*\"stop\" + 0.016*\"wind\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"denmark\" + 0.012*\"farid\" + 0.011*\"turkish\"\n", + "2019-01-31 00:58:17,483 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.029*\"poison\" + 0.027*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.020*\"poland\" + 0.015*\"unfortun\" + 0.013*\"czech\"\n", + "2019-01-31 00:58:17,489 : INFO : topic diff=0.004143, rho=0.028548\n", + "2019-01-31 00:58:17,644 : INFO : PROGRESS: pass 0, at document #2456000/4922894\n", + "2019-01-31 00:58:19,016 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:19,282 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 00:58:19,283 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.013*\"shirin\" + 0.012*\"kim\"\n", + "2019-01-31 00:58:19,284 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.024*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:58:19,285 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:58:19,287 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 
0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:58:19,292 : INFO : topic diff=0.004388, rho=0.028537\n", + "2019-01-31 00:58:19,449 : INFO : PROGRESS: pass 0, at document #2458000/4922894\n", + "2019-01-31 00:58:20,842 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:21,108 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.027*\"workplac\" + 0.027*\"champion\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.020*\"rainfal\" + 0.019*\"alic\" + 0.018*\"atheist\"\n", + "2019-01-31 00:58:21,109 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:58:21,111 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.018*\"sweden\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.016*\"wind\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.012*\"denmark\" + 0.012*\"farid\" + 0.011*\"turkish\"\n", + "2019-01-31 00:58:21,112 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.011*\"lizard\"\n", + "2019-01-31 00:58:21,113 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:58:21,119 : INFO : topic diff=0.004239, rho=0.028525\n", + "2019-01-31 00:58:23,789 : INFO : -11.431 per-word bound, 2760.2 perplexity estimate based on a held-out corpus of 2000 documents with 559575 words\n", + "2019-01-31 00:58:23,790 : INFO : PROGRESS: pass 0, at document #2460000/4922894\n", + "2019-01-31 00:58:25,160 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 00:58:25,426 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.018*\"sweden\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"norwegian\" + 0.015*\"damag\" + 0.012*\"denmark\" + 0.012*\"farid\" + 0.011*\"huntsvil\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:58:25,427 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.021*\"member\" + 0.021*\"govern\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"seri\"\n", + "2019-01-31 00:58:25,428 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.039*\"tortur\" + 0.033*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:58:25,429 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:58:25,430 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 00:58:25,436 : INFO : topic diff=0.004059, rho=0.028513\n", + "2019-01-31 00:58:25,654 : INFO : PROGRESS: pass 0, at document #2462000/4922894\n", + "2019-01-31 00:58:27,060 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:27,326 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.018*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 00:58:27,327 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"exampl\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"southern\" 
+ 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:58:27,329 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"will\" + 0.012*\"daughter\"\n", + "2019-01-31 00:58:27,330 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.023*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:58:27,330 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.018*\"english\" + 0.017*\"player\" + 0.016*\"polit\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 00:58:27,336 : INFO : topic diff=0.003703, rho=0.028502\n", + "2019-01-31 00:58:27,491 : INFO : PROGRESS: pass 0, at document #2464000/4922894\n", + "2019-01-31 00:58:28,860 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:29,126 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:58:29,127 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.039*\"tortur\" + 0.033*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:58:29,129 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.018*\"norwai\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"denmark\" + 0.012*\"farid\" + 0.011*\"huntsvil\"\n", + "2019-01-31 00:58:29,130 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 
0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:58:29,131 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:58:29,136 : INFO : topic diff=0.004334, rho=0.028490\n", + "2019-01-31 00:58:29,293 : INFO : PROGRESS: pass 0, at document #2466000/4922894\n", + "2019-01-31 00:58:30,668 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:30,938 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.022*\"act\" + 0.018*\"start\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 00:58:30,939 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.065*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.017*\"prison\"\n", + "2019-01-31 00:58:30,940 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 00:58:30,941 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 00:58:30,942 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 00:58:30,948 : INFO : topic diff=0.004527, rho=0.028479\n", + "2019-01-31 00:58:31,100 : INFO : PROGRESS: pass 0, at document #2468000/4922894\n", + "2019-01-31 00:58:32,443 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:32,710 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:58:32,711 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.021*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:58:32,712 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"will\"\n", + "2019-01-31 00:58:32,713 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 00:58:32,714 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.014*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:58:32,720 : INFO : topic diff=0.004536, rho=0.028467\n", + "2019-01-31 00:58:32,876 : INFO : PROGRESS: pass 0, at document #2470000/4922894\n", + "2019-01-31 00:58:34,256 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:34,522 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:58:34,523 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.022*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 
0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 00:58:34,524 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 00:58:34,525 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.072*\"juli\" + 0.071*\"januari\" + 0.071*\"august\" + 0.070*\"notion\" + 0.070*\"april\" + 0.068*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 00:58:34,526 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.011*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:58:34,532 : INFO : topic diff=0.004253, rho=0.028456\n", + "2019-01-31 00:58:34,689 : INFO : PROGRESS: pass 0, at document #2472000/4922894\n", + "2019-01-31 00:58:36,079 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:36,345 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.039*\"tortur\" + 0.032*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:58:36,346 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.018*\"norwai\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.015*\"damag\" + 0.012*\"farid\" + 0.012*\"denmark\" + 0.011*\"turkish\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:58:36,347 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"alam\" + 0.010*\"televis\" + 0.009*\"affection\"\n", + "2019-01-31 00:58:36,348 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 
0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:58:36,350 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.013*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:58:36,355 : INFO : topic diff=0.003954, rho=0.028444\n", + "2019-01-31 00:58:36,513 : INFO : PROGRESS: pass 0, at document #2474000/4922894\n", + "2019-01-31 00:58:37,910 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:38,176 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.015*\"portugues\" + 0.014*\"kingdom\" + 0.013*\"count\"\n", + "2019-01-31 00:58:38,177 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.038*\"tortur\" + 0.032*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:58:38,179 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\" + 0.009*\"historiographi\"\n", + "2019-01-31 00:58:38,180 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.016*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"jeremiah\" + 0.010*\"european\" + 0.010*\"europ\"\n", + "2019-01-31 00:58:38,181 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:58:38,186 : INFO : topic diff=0.003548, rho=0.028433\n", + "2019-01-31 00:58:38,346 : INFO : PROGRESS: pass 0, at 
document #2476000/4922894\n", + "2019-01-31 00:58:39,749 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:40,019 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:58:40,020 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.027*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:58:40,021 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 00:58:40,023 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:58:40,024 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:58:40,029 : INFO : topic diff=0.004280, rho=0.028421\n", + "2019-01-31 00:58:40,190 : INFO : PROGRESS: pass 0, at document #2478000/4922894\n", + "2019-01-31 00:58:41,585 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:41,852 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:58:41,853 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"armi\" + 
0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:58:41,854 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.026*\"collector\" + 0.018*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:58:41,855 : INFO : topic #9 (0.020): 0.078*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"player\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:58:41,856 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.012*\"kim\"\n", + "2019-01-31 00:58:41,862 : INFO : topic diff=0.004982, rho=0.028410\n", + "2019-01-31 00:58:44,536 : INFO : -11.660 per-word bound, 3236.0 perplexity estimate based on a held-out corpus of 2000 documents with 538649 words\n", + "2019-01-31 00:58:44,536 : INFO : PROGRESS: pass 0, at document #2480000/4922894\n", + "2019-01-31 00:58:45,896 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:46,165 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"black\" + 0.016*\"western\" + 0.016*\"colder\" + 0.012*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.008*\"pain\"\n", + "2019-01-31 00:58:46,166 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:58:46,167 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.016*\"vol\" + 0.016*\"jewish\" + 0.015*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"jeremiah\" + 0.010*\"european\" 
+ 0.009*\"europ\"\n", + "2019-01-31 00:58:46,169 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.023*\"new\" + 0.023*\"palmer\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"includ\" + 0.012*\"open\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:58:46,170 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.065*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:58:46,175 : INFO : topic diff=0.003905, rho=0.028398\n", + "2019-01-31 00:58:46,330 : INFO : PROGRESS: pass 0, at document #2482000/4922894\n", + "2019-01-31 00:58:47,690 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:47,957 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.027*\"men\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.022*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:58:47,958 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.028*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"turin\" + 0.015*\"unfortun\"\n", + "2019-01-31 00:58:47,959 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 00:58:47,960 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"market\" + 0.012*\"million\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 00:58:47,961 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"effect\" + 0.007*\"caus\" + 0.007*\"hormon\" + 0.006*\"treat\" + 0.006*\"proper\"\n", 
+ "2019-01-31 00:58:47,967 : INFO : topic diff=0.004212, rho=0.028387\n", + "2019-01-31 00:58:48,123 : INFO : PROGRESS: pass 0, at document #2484000/4922894\n", + "2019-01-31 00:58:49,495 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:49,762 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.011*\"blur\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:58:49,763 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"differ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:58:49,764 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.030*\"germani\" + 0.016*\"jewish\" + 0.016*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.011*\"jeremiah\" + 0.010*\"european\" + 0.009*\"europ\"\n", + "2019-01-31 00:58:49,765 : INFO : topic #28 (0.020): 0.031*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:58:49,767 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.007*\"caus\" + 0.007*\"effect\" + 0.007*\"have\" + 0.006*\"hormon\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 00:58:49,772 : INFO : topic diff=0.004235, rho=0.028375\n", + "2019-01-31 00:58:49,927 : INFO : PROGRESS: pass 0, at document #2486000/4922894\n", + "2019-01-31 00:58:51,286 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:51,553 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.022*\"schuster\" + 0.021*\"institut\" + 0.020*\"collector\" + 0.020*\"requir\" + 
0.018*\"student\" + 0.014*\"professor\" + 0.013*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 00:58:51,554 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:58:51,555 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.017*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.014*\"damag\" + 0.012*\"turkish\" + 0.012*\"huntsvil\" + 0.012*\"farid\"\n", + "2019-01-31 00:58:51,556 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:58:51,557 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.022*\"factor\" + 0.014*\"adulthood\" + 0.013*\"feel\" + 0.012*\"plaisir\" + 0.011*\"male\" + 0.011*\"genu\" + 0.009*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:58:51,563 : INFO : topic diff=0.003709, rho=0.028364\n", + "2019-01-31 00:58:51,719 : INFO : PROGRESS: pass 0, at document #2488000/4922894\n", + "2019-01-31 00:58:53,091 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:53,357 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.011*\"blur\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:58:53,358 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:58:53,359 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.032*\"priest\" + 0.021*\"rotterdam\" + 0.019*\"grammat\" + 0.019*\"duke\" + 
0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"portugues\" + 0.013*\"kingdom\" + 0.013*\"count\"\n", + "2019-01-31 00:58:53,360 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:58:53,361 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.014*\"adulthood\" + 0.013*\"feel\" + 0.012*\"plaisir\" + 0.011*\"male\" + 0.011*\"genu\" + 0.009*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 00:58:53,367 : INFO : topic diff=0.004803, rho=0.028352\n", + "2019-01-31 00:58:53,521 : INFO : PROGRESS: pass 0, at document #2490000/4922894\n", + "2019-01-31 00:58:54,895 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:55,165 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:58:55,166 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:58:55,167 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"historiographi\" + 0.009*\"centuri\"\n", + "2019-01-31 00:58:55,168 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.008*\"comic\" + 0.008*\"anim\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"blue\"\n", + "2019-01-31 00:58:55,169 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 
0.008*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:58:55,175 : INFO : topic diff=0.003928, rho=0.028341\n", + "2019-01-31 00:58:55,331 : INFO : PROGRESS: pass 0, at document #2492000/4922894\n", + "2019-01-31 00:58:56,716 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:56,982 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.012*\"thailand\"\n", + "2019-01-31 00:58:56,983 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.008*\"pathwai\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:58:56,984 : INFO : topic #16 (0.020): 0.051*\"king\" + 0.032*\"priest\" + 0.021*\"rotterdam\" + 0.020*\"grammat\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"order\" + 0.014*\"portugues\" + 0.013*\"kingdom\"\n", + "2019-01-31 00:58:56,985 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"christian\" + 0.023*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"historiographi\" + 0.009*\"centuri\"\n", + "2019-01-31 00:58:56,986 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:58:56,992 : INFO : topic diff=0.003798, rho=0.028330\n", + "2019-01-31 00:58:57,203 : INFO : PROGRESS: pass 0, at document #2494000/4922894\n", + "2019-01-31 00:58:58,579 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:58:58,845 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 
0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.007*\"championship\" + 0.007*\"uruguayan\"\n", + "2019-01-31 00:58:58,846 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.046*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.013*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 00:58:58,847 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 00:58:58,849 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.023*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"includ\" + 0.012*\"open\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:58:58,850 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:58:58,856 : INFO : topic diff=0.003770, rho=0.028318\n", + "2019-01-31 00:58:59,013 : INFO : PROGRESS: pass 0, at document #2496000/4922894\n", + "2019-01-31 00:59:00,396 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:00,663 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.028*\"arsen\" + 0.024*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.016*\"rosenwald\" + 0.012*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 00:59:00,664 : INFO : topic #35 (0.020): 0.062*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.028*\"poison\" + 0.024*\"personifi\" + 0.022*\"moscow\" + 0.021*\"reprint\" + 0.019*\"poland\" + 0.016*\"turin\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:59:00,665 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" 
+ 0.024*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:59:00,666 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.026*\"new\" + 0.025*\"australia\" + 0.024*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:59:00,667 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"jeremiah\" + 0.009*\"europ\"\n", + "2019-01-31 00:59:00,672 : INFO : topic diff=0.003982, rho=0.028307\n", + "2019-01-31 00:59:00,826 : INFO : PROGRESS: pass 0, at document #2498000/4922894\n", + "2019-01-31 00:59:02,182 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:02,449 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:59:02,450 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"centuri\" + 0.009*\"parish\"\n", + "2019-01-31 00:59:02,451 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 00:59:02,452 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.023*\"factor\" + 0.014*\"adulthood\" + 0.013*\"feel\" + 0.011*\"plaisir\" + 0.011*\"male\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + 
"2019-01-31 00:59:02,453 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:59:02,459 : INFO : topic diff=0.004895, rho=0.028296\n", + "2019-01-31 00:59:05,118 : INFO : -11.711 per-word bound, 3351.7 perplexity estimate based on a held-out corpus of 2000 documents with 559807 words\n", + "2019-01-31 00:59:05,118 : INFO : PROGRESS: pass 0, at document #2500000/4922894\n", + "2019-01-31 00:59:06,482 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:06,749 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"palmer\" + 0.023*\"new\" + 0.013*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 00:59:06,750 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 00:59:06,751 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 00:59:06,752 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:59:06,753 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"workplac\"\n", + "2019-01-31 00:59:06,759 : INFO : topic diff=0.004423, rho=0.028284\n", + "2019-01-31 00:59:06,917 : INFO : 
PROGRESS: pass 0, at document #2502000/4922894\n", + "2019-01-31 00:59:08,300 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:08,566 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"norwai\" + 0.017*\"stop\" + 0.016*\"swedish\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.014*\"damag\" + 0.012*\"farid\" + 0.011*\"turkish\" + 0.011*\"denmark\"\n", + "2019-01-31 00:59:08,567 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.021*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 00:59:08,568 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.066*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:59:08,569 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:59:08,570 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"martin\" + 0.016*\"goal\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:59:08,576 : INFO : topic diff=0.003549, rho=0.028273\n", + "2019-01-31 00:59:08,739 : INFO : PROGRESS: pass 0, at document #2504000/4922894\n", + "2019-01-31 00:59:10,107 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:10,377 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.021*\"wife\" + 0.019*\"tourist\" + 0.017*\"champion\" + 0.015*\"martin\" + 0.014*\"open\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.013*\"tiepolo\"\n", + "2019-01-31 00:59:10,378 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 
0.007*\"southern\" + 0.007*\"exampl\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:59:10,379 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"vacant\"\n", + "2019-01-31 00:59:10,380 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:59:10,381 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 00:59:10,387 : INFO : topic diff=0.004378, rho=0.028262\n", + "2019-01-31 00:59:10,543 : INFO : PROGRESS: pass 0, at document #2506000/4922894\n", + "2019-01-31 00:59:11,913 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:12,180 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:59:12,181 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.027*\"champion\" + 0.027*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.023*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:59:12,182 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"cultur\"\n", + "2019-01-31 00:59:12,183 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.023*\"new\" + 
0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 00:59:12,184 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 00:59:12,190 : INFO : topic diff=0.004373, rho=0.028250\n", + "2019-01-31 00:59:12,344 : INFO : PROGRESS: pass 0, at document #2508000/4922894\n", + "2019-01-31 00:59:13,718 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:13,984 : INFO : topic #45 (0.020): 0.029*\"jpg\" + 0.027*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.009*\"depress\" + 0.008*\"pain\"\n", + "2019-01-31 00:59:13,985 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.044*\"canadian\" + 0.022*\"toronto\" + 0.021*\"hoar\" + 0.019*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"novotná\" + 0.011*\"quebec\"\n", + "2019-01-31 00:59:13,986 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.038*\"tortur\" + 0.033*\"cotton\" + 0.025*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:59:13,987 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.022*\"candid\" + 0.019*\"taxpay\" + 0.015*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:59:13,988 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 00:59:13,994 : INFO : topic 
diff=0.004081, rho=0.028239\n", + "2019-01-31 00:59:14,146 : INFO : PROGRESS: pass 0, at document #2510000/4922894\n", + "2019-01-31 00:59:15,500 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:15,766 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 00:59:15,768 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 00:59:15,769 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.024*\"personifi\" + 0.022*\"moscow\" + 0.021*\"reprint\" + 0.019*\"poland\" + 0.016*\"turin\" + 0.014*\"unfortun\"\n", + "2019-01-31 00:59:15,770 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.021*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:59:15,771 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.007*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:59:15,777 : INFO : topic diff=0.003900, rho=0.028228\n", + "2019-01-31 00:59:15,935 : INFO : PROGRESS: pass 0, at document #2512000/4922894\n", + "2019-01-31 00:59:17,334 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:17,601 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"august\" + 0.071*\"notion\" + 0.070*\"april\" + 0.070*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 00:59:17,602 : INFO : topic #18 (0.020): 
0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:59:17,603 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.066*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.017*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:59:17,604 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"till\"\n", + "2019-01-31 00:59:17,605 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 00:59:17,611 : INFO : topic diff=0.004112, rho=0.028217\n", + "2019-01-31 00:59:17,770 : INFO : PROGRESS: pass 0, at document #2514000/4922894\n", + "2019-01-31 00:59:19,135 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:19,405 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.007*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 00:59:19,406 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 00:59:19,407 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.026*\"final\" + 0.021*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"open\" + 0.014*\"chamber\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:59:19,408 : INFO : topic #18 (0.020): 0.011*\"théori\" + 
0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:59:19,409 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:59:19,415 : INFO : topic diff=0.003551, rho=0.028205\n", + "2019-01-31 00:59:19,575 : INFO : PROGRESS: pass 0, at document #2516000/4922894\n", + "2019-01-31 00:59:21,435 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:21,702 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:59:21,703 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.065*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.017*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:59:21,704 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.012*\"turkei\" + 0.012*\"treeless\" + 0.012*\"turkish\"\n", + "2019-01-31 00:59:21,705 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 00:59:21,706 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.021*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:59:21,712 : INFO : topic diff=0.004172, rho=0.028194\n", + "2019-01-31 00:59:21,870 : INFO 
: PROGRESS: pass 0, at document #2518000/4922894\n", + "2019-01-31 00:59:23,286 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:23,552 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:59:23,554 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 00:59:23,555 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"pseudo\" + 0.009*\"class\" + 0.009*\"task\"\n", + "2019-01-31 00:59:23,556 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.041*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.021*\"reprint\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 00:59:23,557 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.014*\"ret\" + 0.012*\"find\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"squatter\" + 0.012*\"tornado\" + 0.010*\"théori\"\n", + "2019-01-31 00:59:23,563 : INFO : topic diff=0.003930, rho=0.028183\n", + "2019-01-31 00:59:26,153 : INFO : -11.477 per-word bound, 2850.2 perplexity estimate based on a held-out corpus of 2000 documents with 521447 words\n", + "2019-01-31 00:59:26,153 : INFO : PROGRESS: pass 0, at document #2520000/4922894\n", + "2019-01-31 00:59:27,488 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:27,754 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.032*\"cotton\" + 0.025*\"area\" + 
0.023*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 00:59:27,755 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.041*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.021*\"reprint\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.016*\"turin\"\n", + "2019-01-31 00:59:27,756 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.021*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.014*\"tiepolo\"\n", + "2019-01-31 00:59:27,757 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"new\" + 0.025*\"australia\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:59:27,758 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.021*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.015*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:59:27,764 : INFO : topic diff=0.005164, rho=0.028172\n", + "2019-01-31 00:59:27,926 : INFO : PROGRESS: pass 0, at document #2522000/4922894\n", + "2019-01-31 00:59:29,345 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:29,611 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.010*\"diversifi\"\n", + "2019-01-31 00:59:29,613 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.044*\"american\" + 0.026*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 00:59:29,614 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 
0.021*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 00:59:29,615 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 00:59:29,616 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:59:29,622 : INFO : topic diff=0.005141, rho=0.028161\n", + "2019-01-31 00:59:29,780 : INFO : PROGRESS: pass 0, at document #2524000/4922894\n", + "2019-01-31 00:59:31,183 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:31,449 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"pseudo\" + 0.010*\"class\" + 0.009*\"task\"\n", + "2019-01-31 00:59:31,450 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.019*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\" + 0.009*\"parish\"\n", + "2019-01-31 00:59:31,451 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.040*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.021*\"moscow\" + 0.021*\"reprint\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 00:59:31,452 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.030*\"priest\" + 0.020*\"grammat\" + 0.019*\"rotterdam\" + 0.018*\"duke\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"portugues\" + 0.014*\"order\" + 0.013*\"count\"\n", + "2019-01-31 00:59:31,453 : INFO : topic #24 (0.020): 
0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.011*\"storag\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:59:31,459 : INFO : topic diff=0.004120, rho=0.028149\n", + "2019-01-31 00:59:31,612 : INFO : PROGRESS: pass 0, at document #2526000/4922894\n", + "2019-01-31 00:59:32,962 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:33,229 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 00:59:33,230 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"teratogen\"\n", + "2019-01-31 00:59:33,231 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:59:33,233 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.008*\"comic\" + 0.008*\"anim\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"vision\"\n", + "2019-01-31 00:59:33,234 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.025*\"offic\" + 0.023*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.015*\"seri\"\n", + "2019-01-31 00:59:33,240 : INFO : topic diff=0.004776, rho=0.028138\n", + "2019-01-31 00:59:33,460 : INFO : PROGRESS: pass 0, at document #2528000/4922894\n", + "2019-01-31 00:59:34,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:35,144 : INFO : 
topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.027*\"arsen\" + 0.023*\"museo\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.017*\"rosenwald\" + 0.013*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 00:59:35,145 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"nicola\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 00:59:35,146 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.018*\"norwai\" + 0.017*\"stop\" + 0.017*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.013*\"turkish\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.012*\"turkei\"\n", + "2019-01-31 00:59:35,147 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 00:59:35,148 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 00:59:35,154 : INFO : topic diff=0.004358, rho=0.028127\n", + "2019-01-31 00:59:35,316 : INFO : PROGRESS: pass 0, at document #2530000/4922894\n", + "2019-01-31 00:59:36,739 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:37,005 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.030*\"priest\" + 0.020*\"rotterdam\" + 0.019*\"grammat\" + 0.019*\"duke\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"order\" + 0.015*\"portugues\" + 0.013*\"kingdom\"\n", + "2019-01-31 00:59:37,006 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.011*\"televis\" + 0.010*\"sri\" + 0.010*\"alam\" + 0.009*\"affection\"\n", + "2019-01-31 
00:59:37,008 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 00:59:37,009 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"jeremiah\"\n", + "2019-01-31 00:59:37,010 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.040*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.021*\"moscow\" + 0.021*\"reprint\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 00:59:37,016 : INFO : topic diff=0.004921, rho=0.028116\n", + "2019-01-31 00:59:37,167 : INFO : PROGRESS: pass 0, at document #2532000/4922894\n", + "2019-01-31 00:59:38,534 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:38,801 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"class\" + 0.010*\"pseudo\" + 0.009*\"task\"\n", + "2019-01-31 00:59:38,802 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 00:59:38,803 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.023*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:59:38,804 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.022*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 
00:59:38,805 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"land\" + 0.008*\"foam\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:59:38,811 : INFO : topic diff=0.004290, rho=0.028105\n", + "2019-01-31 00:59:38,976 : INFO : PROGRESS: pass 0, at document #2534000/4922894\n", + "2019-01-31 00:59:40,411 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:40,679 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"collector\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 00:59:40,680 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:59:40,682 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 00:59:40,683 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"land\" + 0.008*\"foam\"\n", + "2019-01-31 00:59:40,684 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"simpler\" + 0.013*\"acrimoni\"\n", + "2019-01-31 00:59:40,689 : INFO : topic diff=0.005142, rho=0.028094\n", + "2019-01-31 00:59:40,846 : INFO : PROGRESS: pass 0, at document #2536000/4922894\n", + "2019-01-31 00:59:42,234 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:42,500 : INFO : topic #45 (0.020): 0.029*\"jpg\" + 0.027*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.013*\"record\" + 0.010*\"blind\" + 0.009*\"depress\" + 0.009*\"pain\"\n", + "2019-01-31 00:59:42,501 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.007*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:59:42,502 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.006*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:59:42,503 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"francisco\"\n", + "2019-01-31 00:59:42,505 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 00:59:42,510 : INFO : topic diff=0.004544, rho=0.028083\n", + "2019-01-31 00:59:42,669 : INFO : PROGRESS: pass 0, at document #2538000/4922894\n", + "2019-01-31 00:59:44,064 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:44,330 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\"\n", + "2019-01-31 00:59:44,331 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 
0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 00:59:44,333 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.019*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"historiographi\" + 0.009*\"centuri\"\n", + "2019-01-31 00:59:44,334 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.017*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"acrimoni\" + 0.011*\"direct\"\n", + "2019-01-31 00:59:44,335 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.041*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.021*\"reprint\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 00:59:44,341 : INFO : topic diff=0.004077, rho=0.028072\n", + "2019-01-31 00:59:47,076 : INFO : -12.120 per-word bound, 4451.5 perplexity estimate based on a held-out corpus of 2000 documents with 566639 words\n", + "2019-01-31 00:59:47,077 : INFO : PROGRESS: pass 0, at document #2540000/4922894\n", + "2019-01-31 00:59:48,467 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:48,732 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 00:59:48,733 : INFO : topic #16 (0.020): 0.052*\"king\" + 0.031*\"priest\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.015*\"order\" + 0.014*\"portugues\" + 0.013*\"kingdom\"\n", + "2019-01-31 00:59:48,735 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"jewish\" + 0.014*\"vol\" + 0.014*\"israel\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 
00:59:48,736 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 00:59:48,737 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.023*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 00:59:48,743 : INFO : topic diff=0.004293, rho=0.028061\n", + "2019-01-31 00:59:48,900 : INFO : PROGRESS: pass 0, at document #2542000/4922894\n", + "2019-01-31 00:59:50,265 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:50,531 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 00:59:50,532 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.029*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 00:59:50,534 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 00:59:50,535 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"worldwid\"\n", + "2019-01-31 00:59:50,536 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:59:50,541 : INFO : topic 
diff=0.003814, rho=0.028050\n", + "2019-01-31 00:59:50,701 : INFO : PROGRESS: pass 0, at document #2544000/4922894\n", + "2019-01-31 00:59:52,110 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:52,376 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 00:59:52,377 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 00:59:52,378 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.011*\"market\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 00:59:52,379 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"cultur\"\n", + "2019-01-31 00:59:52,380 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"francisco\" + 0.011*\"juan\"\n", + "2019-01-31 00:59:52,386 : INFO : topic diff=0.003761, rho=0.028039\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 00:59:52,540 : INFO : PROGRESS: pass 0, at document #2546000/4922894\n", + "2019-01-31 00:59:53,887 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:54,154 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.015*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 
0.012*\"john\"\n", + "2019-01-31 00:59:54,155 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 00:59:54,156 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.029*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.011*\"piec\" + 0.011*\"loui\" + 0.009*\"wine\"\n", + "2019-01-31 00:59:54,157 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"pour\" + 0.006*\"govern\"\n", + "2019-01-31 00:59:54,158 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"strategist\" + 0.010*\"linear\"\n", + "2019-01-31 00:59:54,164 : INFO : topic diff=0.004435, rho=0.028028\n", + "2019-01-31 00:59:54,318 : INFO : PROGRESS: pass 0, at document #2548000/4922894\n", + "2019-01-31 00:59:55,692 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:55,961 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 00:59:55,962 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 00:59:55,963 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + 
"2019-01-31 00:59:55,964 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"find\" + 0.012*\"driver\" + 0.012*\"squatter\" + 0.012*\"ret\" + 0.011*\"fool\" + 0.010*\"théori\"\n", + "2019-01-31 00:59:55,965 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 00:59:55,971 : INFO : topic diff=0.004404, rho=0.028017\n", + "2019-01-31 00:59:56,124 : INFO : PROGRESS: pass 0, at document #2550000/4922894\n", + "2019-01-31 00:59:57,478 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:57,745 : INFO : topic #26 (0.020): 0.028*\"champion\" + 0.028*\"workplac\" + 0.028*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 00:59:57,746 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 00:59:57,747 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.019*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 00:59:57,748 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.009*\"septemb\" + 0.009*\"man\" + 0.009*\"comic\" + 0.008*\"anim\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"storag\"\n", + "2019-01-31 00:59:57,749 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 
00:59:57,755 : INFO : topic diff=0.004308, rho=0.028006\n", + "2019-01-31 00:59:57,907 : INFO : PROGRESS: pass 0, at document #2552000/4922894\n", + "2019-01-31 00:59:59,262 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 00:59:59,528 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.022*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.013*\"report\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 00:59:59,530 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 00:59:59,531 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.023*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"word\" + 0.012*\"olympo\"\n", + "2019-01-31 00:59:59,532 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 00:59:59,533 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 00:59:59,538 : INFO : topic diff=0.004098, rho=0.027995\n", + "2019-01-31 00:59:59,691 : INFO : PROGRESS: pass 0, at document #2554000/4922894\n", + "2019-01-31 01:00:01,049 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:01,315 : INFO : topic #26 (0.020): 0.028*\"champion\" + 0.028*\"workplac\" + 0.028*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.018*\"taxpay\" + 
0.017*\"rainfal\"\n", + "2019-01-31 01:00:01,316 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.032*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.016*\"prison\"\n", + "2019-01-31 01:00:01,317 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"palmer\" + 0.023*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:00:01,318 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.022*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"word\" + 0.012*\"olympo\"\n", + "2019-01-31 01:00:01,319 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:00:01,325 : INFO : topic diff=0.004400, rho=0.027984\n", + "2019-01-31 01:00:01,476 : INFO : PROGRESS: pass 0, at document #2556000/4922894\n", + "2019-01-31 01:00:02,821 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:03,087 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:00:03,088 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:00:03,090 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 
0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:00:03,091 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:00:03,092 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.045*\"american\" + 0.026*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:00:03,098 : INFO : topic diff=0.004520, rho=0.027973\n", + "2019-01-31 01:00:03,312 : INFO : PROGRESS: pass 0, at document #2558000/4922894\n", + "2019-01-31 01:00:04,701 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:00:04,968 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:00:04,970 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:00:04,971 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:00:04,972 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\"\n", + "2019-01-31 01:00:04,973 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.021*\"requir\" + 0.021*\"institut\" + 
0.019*\"collector\" + 0.018*\"student\" + 0.017*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:00:04,978 : INFO : topic diff=0.004024, rho=0.027962\n", + "2019-01-31 01:00:07,724 : INFO : -11.708 per-word bound, 3345.2 perplexity estimate based on a held-out corpus of 2000 documents with 594692 words\n", + "2019-01-31 01:00:07,724 : INFO : PROGRESS: pass 0, at document #2560000/4922894\n", + "2019-01-31 01:00:09,122 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:09,389 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:00:09,390 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:00:09,391 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:00:09,392 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"democrat\" + 0.024*\"voluntari\" + 0.022*\"member\" + 0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"report\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 01:00:09,393 : INFO : topic #0 (0.020): 0.071*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.027*\"arsen\" + 0.023*\"museo\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.017*\"rosenwald\" + 0.012*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:00:09,399 : INFO : topic diff=0.005837, rho=0.027951\n", + "2019-01-31 01:00:09,553 : INFO : PROGRESS: pass 0, at document #2562000/4922894\n", + "2019-01-31 01:00:10,916 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:00:11,183 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:11,184 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.017*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"vacant\" + 0.008*\"foam\"\n", + "2019-01-31 01:00:11,185 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"woman\" + 0.028*\"champion\" + 0.027*\"men\" + 0.024*\"olymp\" + 0.020*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.017*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:00:11,186 : INFO : topic #16 (0.020): 0.050*\"king\" + 0.029*\"priest\" + 0.021*\"grammat\" + 0.019*\"rotterdam\" + 0.018*\"duke\" + 0.018*\"quarterli\" + 0.016*\"idiosyncrat\" + 0.016*\"order\" + 0.014*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:00:11,186 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.011*\"francisco\"\n", + "2019-01-31 01:00:11,192 : INFO : topic diff=0.004153, rho=0.027940\n", + "2019-01-31 01:00:11,347 : INFO : PROGRESS: pass 0, at document #2564000/4922894\n", + "2019-01-31 01:00:12,724 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:12,991 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.027*\"hous\" + 0.019*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"strategist\" + 0.010*\"linear\"\n", + "2019-01-31 01:00:12,992 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.076*\"sens\" + 0.074*\"octob\" + 0.073*\"januari\" + 0.070*\"juli\" + 0.069*\"notion\" + 0.068*\"august\" + 
0.068*\"judici\" + 0.067*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 01:00:12,993 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:00:12,994 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:00:12,995 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:13,001 : INFO : topic diff=0.003664, rho=0.027929\n", + "2019-01-31 01:00:13,154 : INFO : PROGRESS: pass 0, at document #2566000/4922894\n", + "2019-01-31 01:00:14,500 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:14,767 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 01:00:14,768 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"black\" + 0.016*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"pain\" + 0.009*\"depress\"\n", + "2019-01-31 01:00:14,769 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"pseudo\" + 0.009*\"task\"\n", + "2019-01-31 01:00:14,770 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 
0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:00:14,771 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:00:14,776 : INFO : topic diff=0.004213, rho=0.027918\n", + "2019-01-31 01:00:14,937 : INFO : PROGRESS: pass 0, at document #2568000/4922894\n", + "2019-01-31 01:00:16,300 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:16,566 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.025*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:00:16,567 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.076*\"sens\" + 0.075*\"octob\" + 0.073*\"januari\" + 0.070*\"juli\" + 0.069*\"august\" + 0.069*\"notion\" + 0.068*\"judici\" + 0.067*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 01:00:16,568 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"yawn\" + 0.010*\"folei\" + 0.010*\"reconstruct\"\n", + "2019-01-31 01:00:16,569 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:00:16,570 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:00:16,576 : INFO : topic diff=0.004524, rho=0.027907\n", + "2019-01-31 01:00:16,733 : INFO : PROGRESS: pass 0, at document #2570000/4922894\n", + "2019-01-31 01:00:18,121 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:00:18,387 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.011*\"fool\" + 0.011*\"ret\" + 0.010*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 01:00:18,388 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:00:18,389 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.013*\"feel\" + 0.012*\"adulthood\" + 0.011*\"male\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.008*\"western\" + 0.008*\"biom\" + 0.008*\"median\"\n", + "2019-01-31 01:00:18,390 : INFO : topic #25 (0.020): 0.030*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:00:18,391 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:00:18,397 : INFO : topic diff=0.003682, rho=0.027896\n", + "2019-01-31 01:00:18,552 : INFO : PROGRESS: pass 0, at document #2572000/4922894\n", + "2019-01-31 01:00:19,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:20,206 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:00:20,207 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"théori\" 
+ 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"differ\"\n", + "2019-01-31 01:00:20,208 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:00:20,209 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"black\" + 0.015*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.010*\"pain\" + 0.009*\"depress\"\n", + "2019-01-31 01:00:20,210 : INFO : topic #0 (0.020): 0.070*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.028*\"arsen\" + 0.023*\"museo\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.016*\"rosenwald\" + 0.013*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:00:20,216 : INFO : topic diff=0.004262, rho=0.027886\n", + "2019-01-31 01:00:20,372 : INFO : PROGRESS: pass 0, at document #2574000/4922894\n", + "2019-01-31 01:00:21,742 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:22,008 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:22,009 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.010*\"bahá\"\n", + "2019-01-31 01:00:22,010 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"palmer\" + 0.022*\"new\" + 0.014*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:00:22,011 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"théori\" + 
0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"differ\"\n", + "2019-01-31 01:00:22,012 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.009*\"affection\"\n", + "2019-01-31 01:00:22,018 : INFO : topic diff=0.003424, rho=0.027875\n", + "2019-01-31 01:00:22,175 : INFO : PROGRESS: pass 0, at document #2576000/4922894\n", + "2019-01-31 01:00:23,573 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:23,839 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:00:23,840 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.022*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:00:23,842 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"yawn\" + 0.010*\"folei\" + 0.010*\"reconstruct\"\n", + "2019-01-31 01:00:23,842 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.044*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.023*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.014*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:00:23,844 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:23,849 : INFO : topic diff=0.004258, rho=0.027864\n", + "2019-01-31 01:00:24,006 : INFO : PROGRESS: pass 0, at document 
#2578000/4922894\n", + "2019-01-31 01:00:25,369 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:25,635 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"cultur\"\n", + "2019-01-31 01:00:25,636 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"english\" + 0.018*\"player\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:00:25,637 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:00:25,638 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:00:25,639 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:00:25,645 : INFO : topic diff=0.003997, rho=0.027853\n", + "2019-01-31 01:00:28,287 : INFO : -11.600 per-word bound, 3104.7 perplexity estimate based on a held-out corpus of 2000 documents with 542959 words\n", + "2019-01-31 01:00:28,287 : INFO : PROGRESS: pass 0, at document #2580000/4922894\n", + "2019-01-31 01:00:29,646 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:29,912 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 
0.019*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:00:29,913 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:00:29,914 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.010*\"bahá\"\n", + "2019-01-31 01:00:29,915 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.027*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:00:29,916 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.012*\"feel\" + 0.012*\"adulthood\" + 0.011*\"plaisir\" + 0.011*\"male\" + 0.010*\"genu\" + 0.008*\"western\" + 0.008*\"biom\" + 0.008*\"median\"\n", + "2019-01-31 01:00:29,922 : INFO : topic diff=0.004202, rho=0.027842\n", + "2019-01-31 01:00:30,077 : INFO : PROGRESS: pass 0, at document #2582000/4922894\n", + "2019-01-31 01:00:31,454 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:31,721 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\" + 0.008*\"vacant\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:00:31,722 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.012*\"feel\" + 0.012*\"adulthood\" + 0.011*\"plaisir\" + 0.011*\"male\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 01:00:31,723 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 
0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:00:31,724 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.027*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"rainfal\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:00:31,724 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:00:31,730 : INFO : topic diff=0.003672, rho=0.027832\n", + "2019-01-31 01:00:31,887 : INFO : PROGRESS: pass 0, at document #2584000/4922894\n", + "2019-01-31 01:00:33,264 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:33,530 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.019*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:00:33,531 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.027*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"rainfal\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:00:33,532 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\" + 0.008*\"foam\"\n", + "2019-01-31 01:00:33,533 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.041*\"sovereignti\" + 0.032*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.017*\"unfortun\" + 0.014*\"turin\"\n", + "2019-01-31 01:00:33,534 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"sens\" + 0.077*\"octob\" + 0.074*\"januari\" + 0.071*\"juli\" + 0.070*\"august\" + 
0.070*\"notion\" + 0.069*\"judici\" + 0.068*\"april\" + 0.067*\"decatur\"\n", + "2019-01-31 01:00:33,540 : INFO : topic diff=0.003920, rho=0.027821\n", + "2019-01-31 01:00:33,690 : INFO : PROGRESS: pass 0, at document #2586000/4922894\n", + "2019-01-31 01:00:35,038 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:35,305 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.009*\"septemb\" + 0.009*\"man\" + 0.009*\"comic\" + 0.008*\"anim\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"storag\"\n", + "2019-01-31 01:00:35,306 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:00:35,307 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"swedish\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"denmark\" + 0.012*\"turkish\" + 0.011*\"danish\"\n", + "2019-01-31 01:00:35,308 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.010*\"bahá\"\n", + "2019-01-31 01:00:35,310 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 01:00:35,315 : INFO : topic diff=0.004344, rho=0.027810\n", + "2019-01-31 01:00:35,475 : INFO : PROGRESS: pass 0, at document #2588000/4922894\n", + "2019-01-31 01:00:36,869 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:37,136 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 
0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.011*\"north\"\n", + "2019-01-31 01:00:37,137 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:00:37,138 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"john\" + 0.012*\"daughter\"\n", + "2019-01-31 01:00:37,139 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"carlo\"\n", + "2019-01-31 01:00:37,140 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:00:37,146 : INFO : topic diff=0.004034, rho=0.027799\n", + "2019-01-31 01:00:37,362 : INFO : PROGRESS: pass 0, at document #2590000/4922894\n", + "2019-01-31 01:00:38,758 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:39,024 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:00:39,025 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:39,026 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.043*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"new\" 
+ 0.015*\"hydrogen\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:00:39,027 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:00:39,028 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:00:39,034 : INFO : topic diff=0.005270, rho=0.027789\n", + "2019-01-31 01:00:39,185 : INFO : PROGRESS: pass 0, at document #2592000/4922894\n", + "2019-01-31 01:00:40,544 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:40,810 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.043*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:00:40,812 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"warmth\" + 0.017*\"lagrang\" + 0.017*\"area\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:00:40,813 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.039*\"struggl\" + 0.031*\"high\" + 0.031*\"educ\" + 0.025*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"gothic\" + 0.009*\"class\"\n", + "2019-01-31 01:00:40,814 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:00:40,815 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 
0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"francisco\"\n", + "2019-01-31 01:00:40,821 : INFO : topic diff=0.004560, rho=0.027778\n", + "2019-01-31 01:00:40,973 : INFO : PROGRESS: pass 0, at document #2594000/4922894\n", + "2019-01-31 01:00:42,324 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:42,591 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.015*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:00:42,592 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"francisco\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:00:42,593 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.033*\"yawn\" + 0.031*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.019*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:00:42,594 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.017*\"area\" + 0.017*\"warmth\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:00:42,595 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:00:42,601 : INFO : topic diff=0.004290, rho=0.027767\n", + "2019-01-31 01:00:42,756 : INFO : PROGRESS: pass 0, at document #2596000/4922894\n", + "2019-01-31 01:00:44,124 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:44,391 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 
0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"cultur\"\n", + "2019-01-31 01:00:44,392 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.018*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:00:44,393 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.011*\"briarwood\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 01:00:44,394 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.009*\"khalsa\" + 0.009*\"affection\"\n", + "2019-01-31 01:00:44,395 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.012*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:00:44,401 : INFO : topic diff=0.003818, rho=0.027756\n", + "2019-01-31 01:00:44,561 : INFO : PROGRESS: pass 0, at document #2598000/4922894\n", + "2019-01-31 01:00:45,976 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:46,243 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:46,244 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"yawn\" + 0.010*\"folei\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:00:46,245 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.045*\"american\" 
+ 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.018*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:00:46,246 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"violent\"\n", + "2019-01-31 01:00:46,247 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:00:46,253 : INFO : topic diff=0.004088, rho=0.027746\n", + "2019-01-31 01:00:48,972 : INFO : -11.393 per-word bound, 2688.5 perplexity estimate based on a held-out corpus of 2000 documents with 584820 words\n", + "2019-01-31 01:00:48,972 : INFO : PROGRESS: pass 0, at document #2600000/4922894\n", + "2019-01-31 01:00:50,359 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:50,626 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.022*\"requir\" + 0.021*\"institut\" + 0.019*\"collector\" + 0.018*\"student\" + 0.016*\"professor\" + 0.013*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:00:50,627 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.014*\"italian\" + 0.013*\"soviet\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"francisco\"\n", + "2019-01-31 01:00:50,628 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.033*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.009*\"khalsa\" + 0.009*\"affection\"\n", + "2019-01-31 01:00:50,629 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 
0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:00:50,630 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.039*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:00:50,637 : INFO : topic diff=0.004798, rho=0.027735\n", + "2019-01-31 01:00:50,797 : INFO : PROGRESS: pass 0, at document #2602000/4922894\n", + "2019-01-31 01:00:52,196 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:52,463 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.034*\"raid\" + 0.026*\"arsen\" + 0.023*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.016*\"rosenwald\" + 0.012*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:00:52,464 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"have\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:00:52,465 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.021*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.013*\"liber\"\n", + "2019-01-31 01:00:52,466 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:00:52,467 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.012*\"feel\" + 0.011*\"plaisir\" + 0.011*\"adulthood\" + 0.011*\"male\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 01:00:52,473 : INFO : topic diff=0.003857, rho=0.027724\n", + "2019-01-31 01:00:52,626 : INFO : PROGRESS: pass 0, at document #2604000/4922894\n", + "2019-01-31 
01:00:53,968 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:54,234 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:00:54,235 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.019*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:00:54,236 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:00:54,237 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:00:54,238 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:00:54,244 : INFO : topic diff=0.003731, rho=0.027714\n", + "2019-01-31 01:00:54,400 : INFO : PROGRESS: pass 0, at document #2606000/4922894\n", + "2019-01-31 01:00:55,767 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:56,033 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"have\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:00:56,035 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 
0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:00:56,036 : INFO : topic #26 (0.020): 0.028*\"woman\" + 0.028*\"workplac\" + 0.028*\"champion\" + 0.027*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"rainfal\" + 0.017*\"atheist\"\n", + "2019-01-31 01:00:56,036 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:00:56,037 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.043*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.019*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:00:56,043 : INFO : topic diff=0.003342, rho=0.027703\n", + "2019-01-31 01:00:56,196 : INFO : PROGRESS: pass 0, at document #2608000/4922894\n", + "2019-01-31 01:00:57,545 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:57,811 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.016*\"stop\" + 0.014*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"denmark\" + 0.011*\"danish\" + 0.011*\"turkish\"\n", + "2019-01-31 01:00:57,812 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.015*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 0.012*\"john\" + 0.012*\"daughter\"\n", + "2019-01-31 01:00:57,813 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.040*\"struggl\" + 0.031*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.009*\"class\"\n", + "2019-01-31 01:00:57,814 : INFO : topic #32 (0.020): 0.051*\"district\" + 
0.043*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.025*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:00:57,815 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n", + "2019-01-31 01:00:57,821 : INFO : topic diff=0.004042, rho=0.027692\n", + "2019-01-31 01:00:57,978 : INFO : PROGRESS: pass 0, at document #2610000/4922894\n", + "2019-01-31 01:00:59,353 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:00:59,619 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.040*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.017*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:00:59,620 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"sens\" + 0.078*\"octob\" + 0.075*\"januari\" + 0.073*\"juli\" + 0.072*\"august\" + 0.071*\"notion\" + 0.071*\"judici\" + 0.070*\"april\" + 0.069*\"decatur\"\n", + "2019-01-31 01:00:59,621 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"have\" + 0.006*\"treat\"\n", + "2019-01-31 01:00:59,622 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.011*\"feel\" + 0.011*\"plaisir\" + 0.011*\"adulthood\" + 0.011*\"genu\" + 0.010*\"male\" + 0.008*\"biom\" + 0.008*\"western\" + 0.008*\"median\"\n", + "2019-01-31 01:00:59,623 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:00:59,630 : INFO : topic diff=0.003716, rho=0.027682\n", + 
"2019-01-31 01:00:59,783 : INFO : PROGRESS: pass 0, at document #2612000/4922894\n", + "2019-01-31 01:01:01,149 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:01,415 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"acrimoni\" + 0.011*\"movi\" + 0.010*\"direct\"\n", + "2019-01-31 01:01:01,416 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"taxpay\" + 0.021*\"candid\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"tornado\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"squatter\"\n", + "2019-01-31 01:01:01,418 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:01:01,419 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"rainfal\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:01:01,419 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"sens\" + 0.078*\"octob\" + 0.075*\"januari\" + 0.073*\"juli\" + 0.072*\"august\" + 0.071*\"notion\" + 0.071*\"judici\" + 0.070*\"april\" + 0.069*\"decatur\"\n", + "2019-01-31 01:01:01,425 : INFO : topic diff=0.004119, rho=0.027671\n", + "2019-01-31 01:01:01,577 : INFO : PROGRESS: pass 0, at document #2614000/4922894\n", + "2019-01-31 01:01:02,926 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:03,192 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"taxpay\" + 0.021*\"candid\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.010*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:01:03,193 : INFO : topic #14 
(0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:01:03,194 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"have\"\n", + "2019-01-31 01:01:03,195 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.014*\"quebec\"\n", + "2019-01-31 01:01:03,197 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:01:03,203 : INFO : topic diff=0.004697, rho=0.027661\n", + "2019-01-31 01:01:03,363 : INFO : PROGRESS: pass 0, at document #2616000/4922894\n", + "2019-01-31 01:01:04,777 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:05,043 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"encyclopedia\" + 0.006*\"develop\"\n", + "2019-01-31 01:01:05,045 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.021*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:01:05,046 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"sri\" + 0.011*\"muskoge\" + 0.010*\"tajikistan\" + 0.009*\"affection\"\n", + "2019-01-31 01:01:05,047 : INFO : topic #26 
(0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:01:05,048 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:01:05,054 : INFO : topic diff=0.004615, rho=0.027650\n", + "2019-01-31 01:01:05,207 : INFO : PROGRESS: pass 0, at document #2618000/4922894\n", + "2019-01-31 01:01:06,567 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:06,834 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.037*\"tortur\" + 0.032*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:01:06,835 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:01:06,836 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.011*\"blind\" + 0.010*\"pain\" + 0.009*\"depress\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:01:06,837 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:01:06,838 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + 
"2019-01-31 01:01:06,844 : INFO : topic diff=0.003545, rho=0.027639\n", + "2019-01-31 01:01:09,520 : INFO : -11.563 per-word bound, 3025.0 perplexity estimate based on a held-out corpus of 2000 documents with 519730 words\n", + "2019-01-31 01:01:09,520 : INFO : PROGRESS: pass 0, at document #2620000/4922894\n", + "2019-01-31 01:01:10,899 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:11,166 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.027*\"arsen\" + 0.023*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.016*\"rosenwald\" + 0.013*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:01:11,167 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.015*\"taiwan\" + 0.014*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 01:01:11,168 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.012*\"centuri\" + 0.009*\"historiographi\" + 0.009*\"relationship\" + 0.009*\"poll\"\n", + "2019-01-31 01:01:11,169 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:01:11,170 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:01:11,176 : INFO : topic diff=0.003525, rho=0.027629\n", + "2019-01-31 01:01:11,337 : INFO : PROGRESS: pass 0, at document #2622000/4922894\n", + "2019-01-31 01:01:13,198 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:13,464 : INFO : topic #39 (0.020): 0.059*\"canada\" + 
0.045*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:01:13,465 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:01:13,466 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.029*\"priest\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.014*\"portugues\" + 0.014*\"order\" + 0.014*\"brazil\"\n", + "2019-01-31 01:01:13,467 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:01:13,468 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:01:13,474 : INFO : topic diff=0.004504, rho=0.027618\n", + "2019-01-31 01:01:13,692 : INFO : PROGRESS: pass 0, at document #2624000/4922894\n", + "2019-01-31 01:01:15,087 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:15,352 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:01:15,353 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.021*\"institut\" + 0.019*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.013*\"http\" + 0.012*\"word\" + 0.012*\"degre\"\n", + "2019-01-31 01:01:15,354 : INFO : topic #3 
(0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.022*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:01:15,355 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.024*\"factor\" + 0.012*\"plaisir\" + 0.011*\"feel\" + 0.011*\"genu\" + 0.010*\"adulthood\" + 0.010*\"male\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"biom\"\n", + "2019-01-31 01:01:15,357 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:01:15,362 : INFO : topic diff=0.004411, rho=0.027608\n", + "2019-01-31 01:01:15,521 : INFO : PROGRESS: pass 0, at document #2626000/4922894\n", + "2019-01-31 01:01:16,904 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:17,171 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.039*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:01:17,172 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:01:17,173 : INFO : topic #20 (0.020): 0.138*\"scholar\" + 0.039*\"struggl\" + 0.031*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 01:01:17,174 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.026*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:01:17,175 : INFO : topic #45 (0.020): 
0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.010*\"pain\" + 0.009*\"depress\"\n", + "2019-01-31 01:01:17,181 : INFO : topic diff=0.004979, rho=0.027597\n", + "2019-01-31 01:01:17,341 : INFO : PROGRESS: pass 0, at document #2628000/4922894\n", + "2019-01-31 01:01:18,752 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:19,018 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:01:19,019 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.014*\"taiwan\" + 0.014*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:01:19,020 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.043*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.031*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:01:19,021 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:01:19,022 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:01:19,028 : INFO : topic diff=0.004392, rho=0.027587\n", + "2019-01-31 01:01:19,197 : INFO : PROGRESS: pass 0, at document #2630000/4922894\n", + "2019-01-31 01:01:20,624 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:20,890 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 
0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"blind\" + 0.010*\"pain\" + 0.009*\"depress\"\n", + "2019-01-31 01:01:20,892 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.024*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:01:20,893 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.023*\"factor\" + 0.012*\"plaisir\" + 0.011*\"feel\" + 0.011*\"genu\" + 0.010*\"adulthood\" + 0.010*\"male\" + 0.008*\"biom\" + 0.008*\"median\" + 0.008*\"western\"\n", + "2019-01-31 01:01:20,894 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.029*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.014*\"order\" + 0.014*\"brazil\" + 0.013*\"portugues\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:01:20,895 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.015*\"leah\" + 0.015*\"taiwan\" + 0.014*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:01:20,901 : INFO : topic diff=0.004655, rho=0.027576\n", + "2019-01-31 01:01:21,063 : INFO : PROGRESS: pass 0, at document #2632000/4922894\n", + "2019-01-31 01:01:22,484 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:22,750 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"taxpay\" + 0.020*\"candid\" + 0.014*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 01:01:22,751 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"have\" + 0.006*\"treat\"\n", + "2019-01-31 
01:01:22,752 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.034*\"perceptu\" + 0.022*\"theater\" + 0.018*\"damn\" + 0.018*\"place\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:01:22,753 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:01:22,755 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.012*\"centuri\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\"\n", + "2019-01-31 01:01:22,760 : INFO : topic diff=0.004501, rho=0.027566\n", + "2019-01-31 01:01:22,923 : INFO : PROGRESS: pass 0, at document #2634000/4922894\n", + "2019-01-31 01:01:24,352 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:24,618 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"vacant\" + 0.009*\"foam\"\n", + "2019-01-31 01:01:24,619 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:01:24,620 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.014*\"order\" + 0.013*\"portugues\" + 0.013*\"kingdom\"\n", + "2019-01-31 01:01:24,622 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 
01:01:24,623 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.046*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:01:24,628 : INFO : topic diff=0.004843, rho=0.027555\n", + "2019-01-31 01:01:24,790 : INFO : PROGRESS: pass 0, at document #2636000/4922894\n", + "2019-01-31 01:01:26,209 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:26,476 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.009*\"septemb\" + 0.008*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"storag\"\n", + "2019-01-31 01:01:26,477 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.021*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 01:01:26,478 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.014*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 01:01:26,479 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.027*\"arsen\" + 0.024*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.017*\"rosenwald\" + 0.013*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:01:26,480 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.033*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.010*\"tajikistan\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:01:26,486 : INFO : topic diff=0.004382, rho=0.027545\n", + "2019-01-31 01:01:26,647 : INFO : PROGRESS: pass 0, at document #2638000/4922894\n", + "2019-01-31 01:01:28,029 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 01:01:28,298 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.043*\"vigour\" + 0.042*\"popolo\" + 0.036*\"tortur\" + 0.031*\"cotton\" + 0.024*\"area\" + 0.024*\"multitud\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:01:28,299 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:01:28,300 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:01:28,301 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 01:01:28,303 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:01:28,308 : INFO : topic diff=0.004108, rho=0.027535\n", + "2019-01-31 01:01:31,013 : INFO : -11.656 per-word bound, 3227.8 perplexity estimate based on a held-out corpus of 2000 documents with 541004 words\n", + "2019-01-31 01:01:31,013 : INFO : PROGRESS: pass 0, at document #2640000/4922894\n", + "2019-01-31 01:01:32,405 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:32,672 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.034*\"perceptu\" + 0.022*\"theater\" + 0.018*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:01:32,673 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 
0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:01:32,674 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n", + "2019-01-31 01:01:32,676 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:01:32,677 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:01:32,683 : INFO : topic diff=0.003775, rho=0.027524\n", + "2019-01-31 01:01:32,843 : INFO : PROGRESS: pass 0, at document #2642000/4922894\n", + "2019-01-31 01:01:34,253 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:34,520 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.010*\"pain\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:01:34,521 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.024*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:01:34,522 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.015*\"shirin\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.013*\"taiwan\"\n", + "2019-01-31 01:01:34,523 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.038*\"sovereignti\" + 
0.033*\"rural\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:01:34,524 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.013*\"bypass\" + 0.013*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 01:01:34,529 : INFO : topic diff=0.004781, rho=0.027514\n", + "2019-01-31 01:01:34,689 : INFO : PROGRESS: pass 0, at document #2644000/4922894\n", + "2019-01-31 01:01:36,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:36,355 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:01:36,356 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.016*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:01:36,357 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:01:36,358 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.011*\"landslid\"\n", + "2019-01-31 01:01:36,359 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:01:36,365 
: INFO : topic diff=0.004381, rho=0.027503\n", + "2019-01-31 01:01:36,524 : INFO : PROGRESS: pass 0, at document #2646000/4922894\n", + "2019-01-31 01:01:37,916 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:38,184 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 01:01:38,185 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"nation\" + 0.022*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:01:38,186 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.023*\"hoar\" + 0.023*\"toronto\" + 0.020*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:01:38,187 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:01:38,188 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.014*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:01:38,194 : INFO : topic diff=0.003199, rho=0.027493\n", + "2019-01-31 01:01:38,352 : INFO : PROGRESS: pass 0, at document #2648000/4922894\n", + "2019-01-31 01:01:39,736 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:40,003 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.028*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 
0.009*\"reconstruct\"\n", + "2019-01-31 01:01:40,004 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:01:40,005 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.043*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.031*\"cotton\" + 0.024*\"multitud\" + 0.024*\"area\" + 0.021*\"citi\" + 0.020*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:01:40,006 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:01:40,007 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.027*\"arsen\" + 0.024*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.018*\"rosenwald\" + 0.012*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:01:40,013 : INFO : topic diff=0.004189, rho=0.027482\n", + "2019-01-31 01:01:40,167 : INFO : PROGRESS: pass 0, at document #2650000/4922894\n", + "2019-01-31 01:01:41,538 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:41,808 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:01:41,809 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:01:41,810 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.014*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 
0.011*\"lizard\"\n", + "2019-01-31 01:01:41,811 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.024*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:01:41,812 : INFO : topic #46 (0.020): 0.017*\"norwai\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.016*\"stop\" + 0.015*\"damag\" + 0.013*\"norwegian\" + 0.013*\"wind\" + 0.011*\"turkish\" + 0.011*\"treeless\" + 0.011*\"turkei\"\n", + "2019-01-31 01:01:41,818 : INFO : topic diff=0.004307, rho=0.027472\n", + "2019-01-31 01:01:41,976 : INFO : PROGRESS: pass 0, at document #2652000/4922894\n", + "2019-01-31 01:01:43,368 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:43,635 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:01:43,636 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.023*\"factor\" + 0.012*\"plaisir\" + 0.012*\"feel\" + 0.011*\"male\" + 0.010*\"genu\" + 0.010*\"adulthood\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"biom\"\n", + "2019-01-31 01:01:43,637 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"foam\"\n", + "2019-01-31 01:01:43,638 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.011*\"squatter\" + 0.011*\"landslid\"\n", + "2019-01-31 01:01:43,639 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.013*\"jewish\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"europ\" + 0.010*\"european\" + 0.009*\"austria\"\n", + 
"2019-01-31 01:01:43,646 : INFO : topic diff=0.004178, rho=0.027462\n", + "2019-01-31 01:01:43,861 : INFO : PROGRESS: pass 0, at document #2654000/4922894\n", + "2019-01-31 01:01:45,254 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:45,520 : INFO : topic #16 (0.020): 0.049*\"king\" + 0.030*\"priest\" + 0.021*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"order\"\n", + "2019-01-31 01:01:45,521 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"woman\" + 0.028*\"champion\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"atheist\" + 0.019*\"alic\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:01:45,522 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.017*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:01:45,523 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:01:45,524 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.021*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.012*\"centuri\" + 0.009*\"historiographi\" + 0.009*\"relationship\" + 0.009*\"poll\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:01:45,530 : INFO : topic diff=0.003964, rho=0.027451\n", + "2019-01-31 01:01:45,685 : INFO : PROGRESS: pass 0, at document #2656000/4922894\n", + "2019-01-31 01:01:47,060 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:47,327 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" 
+ 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:01:47,328 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.028*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:01:47,329 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:01:47,330 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:01:47,331 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.015*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"winner\"\n", + "2019-01-31 01:01:47,337 : INFO : topic diff=0.003786, rho=0.027441\n", + "2019-01-31 01:01:47,491 : INFO : PROGRESS: pass 0, at document #2658000/4922894\n", + "2019-01-31 01:01:48,834 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:49,101 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 01:01:49,102 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.035*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:01:49,103 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 
0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:01:49,104 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"life\" + 0.012*\"john\"\n", + "2019-01-31 01:01:49,105 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.019*\"ontario\" + 0.016*\"novotná\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:01:49,111 : INFO : topic diff=0.004013, rho=0.027431\n", + "2019-01-31 01:01:51,765 : INFO : -11.632 per-word bound, 3173.2 perplexity estimate based on a held-out corpus of 2000 documents with 553630 words\n", + "2019-01-31 01:01:51,765 : INFO : PROGRESS: pass 0, at document #2660000/4922894\n", + "2019-01-31 01:01:53,126 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:53,392 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.020*\"dutch\" + 0.018*\"english\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:01:53,394 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:01:53,395 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"alic\" + 0.019*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:01:53,396 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.012*\"fool\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + 
"2019-01-31 01:01:53,397 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:01:53,403 : INFO : topic diff=0.004514, rho=0.027420\n", + "2019-01-31 01:01:53,564 : INFO : PROGRESS: pass 0, at document #2662000/4922894\n", + "2019-01-31 01:01:54,975 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:55,242 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:01:55,243 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"method\"\n", + "2019-01-31 01:01:55,244 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:01:55,245 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.014*\"italian\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:01:55,246 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:01:55,252 : INFO : topic diff=0.004491, rho=0.027410\n", + "2019-01-31 01:01:55,405 : INFO : PROGRESS: pass 0, at document #2664000/4922894\n", + "2019-01-31 01:01:56,765 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 01:01:57,032 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"record\" + 0.011*\"pain\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:01:57,033 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:01:57,034 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"taxpay\" + 0.021*\"candid\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:01:57,035 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"method\"\n", + "2019-01-31 01:01:57,036 : INFO : topic #46 (0.020): 0.017*\"norwai\" + 0.016*\"swedish\" + 0.016*\"sweden\" + 0.016*\"stop\" + 0.015*\"damag\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.011*\"turkish\" + 0.011*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:01:57,042 : INFO : topic diff=0.004277, rho=0.027400\n", + "2019-01-31 01:01:57,196 : INFO : PROGRESS: pass 0, at document #2666000/4922894\n", + "2019-01-31 01:01:58,554 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:01:58,821 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"method\"\n", + "2019-01-31 01:01:58,822 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.016*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 
0.006*\"encyclopedia\"\n", + "2019-01-31 01:01:58,823 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:01:58,824 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:01:58,825 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.013*\"bypass\" + 0.013*\"report\" + 0.013*\"selma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:01:58,830 : INFO : topic diff=0.004350, rho=0.027390\n", + "2019-01-31 01:01:58,987 : INFO : PROGRESS: pass 0, at document #2668000/4922894\n", + "2019-01-31 01:02:00,372 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:00,638 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.020*\"dutch\" + 0.018*\"english\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:02:00,639 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:02:00,640 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:02:00,641 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" 
+ 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 01:02:00,642 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"noll\" + 0.022*\"japanes\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:02:00,648 : INFO : topic diff=0.003914, rho=0.027379\n", + "2019-01-31 01:02:00,799 : INFO : PROGRESS: pass 0, at document #2670000/4922894\n", + "2019-01-31 01:02:02,142 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:02,410 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 01:02:02,411 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:02:02,412 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:02:02,413 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:02:02,414 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:02:02,420 : INFO : topic diff=0.004387, rho=0.027369\n", + "2019-01-31 01:02:02,576 : INFO : PROGRESS: pass 0, at document #2672000/4922894\n", + 
"2019-01-31 01:02:03,958 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:04,226 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:02:04,228 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:02:04,229 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"noll\" + 0.022*\"japanes\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:02:04,230 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.026*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:02:04,231 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:02:04,237 : INFO : topic diff=0.003681, rho=0.027359\n", + "2019-01-31 01:02:04,397 : INFO : PROGRESS: pass 0, at document #2674000/4922894\n", + "2019-01-31 01:02:05,785 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:06,051 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.033*\"raid\" + 0.026*\"arsen\" + 0.023*\"museo\" + 0.020*\"traceabl\" + 0.019*\"rosenwald\" + 0.018*\"serv\" + 0.012*\"oper\" + 0.011*\"exhaust\"\n", + "2019-01-31 01:02:06,052 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.020*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" 
+ 0.012*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:02:06,053 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.045*\"american\" + 0.026*\"valour\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:02:06,054 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:06,055 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:02:06,061 : INFO : topic diff=0.005288, rho=0.027349\n", + "2019-01-31 01:02:06,218 : INFO : PROGRESS: pass 0, at document #2676000/4922894\n", + "2019-01-31 01:02:07,594 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:07,861 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:02:07,862 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:02:07,863 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.011*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:02:07,864 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 
0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:02:07,865 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:07,872 : INFO : topic diff=0.004575, rho=0.027338\n", + "2019-01-31 01:02:08,028 : INFO : PROGRESS: pass 0, at document #2678000/4922894\n", + "2019-01-31 01:02:09,381 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:09,648 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.045*\"canadian\" + 0.024*\"hoar\" + 0.022*\"toronto\" + 0.020*\"ontario\" + 0.016*\"novotná\" + 0.016*\"hydrogen\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:02:09,648 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.024*\"alic\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:02:09,649 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 01:02:09,650 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.021*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.013*\"bypass\" + 0.013*\"report\" + 0.012*\"seaport\"\n", + "2019-01-31 01:02:09,651 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:09,657 : INFO : topic diff=0.003942, rho=0.027328\n", + "2019-01-31 01:02:12,295 : INFO : -11.608 per-word bound, 3121.9 
perplexity estimate based on a held-out corpus of 2000 documents with 542997 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:02:12,295 : INFO : PROGRESS: pass 0, at document #2680000/4922894\n", + "2019-01-31 01:02:13,649 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:13,915 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:02:13,916 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:02:13,917 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:02:13,918 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.013*\"bypass\" + 0.013*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:02:13,919 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:02:13,925 : INFO : topic diff=0.004059, rho=0.027318\n", + "2019-01-31 01:02:14,077 : INFO : PROGRESS: pass 0, at document #2682000/4922894\n", + "2019-01-31 01:02:15,434 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:15,701 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.011*\"million\" + 
0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:02:15,702 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:02:15,703 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.014*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:02:15,704 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.030*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:15,705 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:02:15,711 : INFO : topic diff=0.004733, rho=0.027308\n", + "2019-01-31 01:02:15,862 : INFO : PROGRESS: pass 0, at document #2684000/4922894\n", + "2019-01-31 01:02:17,213 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:17,479 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.011*\"televis\" + 0.011*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:02:17,480 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"pain\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:02:17,481 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"noll\" + 
0.022*\"japanes\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.018*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:02:17,482 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"encyclopedia\"\n", + "2019-01-31 01:02:17,483 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:02:17,489 : INFO : topic diff=0.004078, rho=0.027298\n", + "2019-01-31 01:02:17,700 : INFO : PROGRESS: pass 0, at document #2686000/4922894\n", + "2019-01-31 01:02:19,090 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:19,357 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.023*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:02:19,358 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:02:19,359 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 01:02:19,360 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:02:19,361 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.013*\"der\" + 
0.013*\"israel\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:19,367 : INFO : topic diff=0.004325, rho=0.027287\n", + "2019-01-31 01:02:19,524 : INFO : PROGRESS: pass 0, at document #2688000/4922894\n", + "2019-01-31 01:02:20,909 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:21,176 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:02:21,177 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:02:21,178 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:02:21,179 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:02:21,180 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.022*\"toronto\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"novotná\" + 0.015*\"misericordia\" + 0.014*\"new\" + 0.013*\"quebec\"\n", + "2019-01-31 01:02:21,186 : INFO : topic diff=0.003675, rho=0.027277\n", + "2019-01-31 01:02:21,341 : INFO : PROGRESS: pass 0, at document #2690000/4922894\n", + "2019-01-31 01:02:22,713 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:22,980 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.024*\"cortic\" + 0.021*\"act\" + 0.018*\"start\" + 
0.013*\"ricardo\" + 0.013*\"case\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.008*\"rudolf\"\n", + "2019-01-31 01:02:22,981 : INFO : topic #32 (0.020): 0.048*\"district\" + 0.043*\"vigour\" + 0.043*\"popolo\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.024*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"regim\" + 0.019*\"cede\"\n", + "2019-01-31 01:02:22,982 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:02:22,983 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.014*\"centuri\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.008*\"poll\"\n", + "2019-01-31 01:02:22,984 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"workplac\" + 0.006*\"gestur\" + 0.006*\"storag\"\n", + "2019-01-31 01:02:22,990 : INFO : topic diff=0.003863, rho=0.027267\n", + "2019-01-31 01:02:23,146 : INFO : PROGRESS: pass 0, at document #2692000/4922894\n", + "2019-01-31 01:02:24,527 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:02:24,793 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:02:24,794 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.018*\"player\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:02:24,795 : INFO : topic #47 (0.020): 
0.064*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:02:24,796 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:02:24,797 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:02:24,803 : INFO : topic diff=0.003497, rho=0.027257\n", + "2019-01-31 01:02:24,960 : INFO : PROGRESS: pass 0, at document #2694000/4922894\n", + "2019-01-31 01:02:26,318 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:26,584 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.020*\"illicit\" + 0.018*\"colder\" + 0.015*\"black\" + 0.015*\"western\" + 0.012*\"pain\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:02:26,585 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.027*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.023*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:02:26,586 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:02:26,587 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:02:26,589 : INFO : topic #36 (0.020): 
0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:02:26,595 : INFO : topic diff=0.004308, rho=0.027247\n", + "2019-01-31 01:02:26,749 : INFO : PROGRESS: pass 0, at document #2696000/4922894\n", + "2019-01-31 01:02:28,118 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:28,384 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"love\" + 0.006*\"workplac\" + 0.006*\"gestur\" + 0.006*\"storag\"\n", + "2019-01-31 01:02:28,385 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:02:28,386 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:02:28,387 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:02:28,389 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:02:28,395 : INFO : topic diff=0.005076, rho=0.027237\n", + "2019-01-31 01:02:28,552 : INFO : PROGRESS: pass 0, at document #2698000/4922894\n", + "2019-01-31 01:02:29,924 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:30,191 : INFO : topic 
#10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"have\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:02:30,192 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.022*\"hong\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.015*\"leah\" + 0.014*\"kim\"\n", + "2019-01-31 01:02:30,193 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"vacant\"\n", + "2019-01-31 01:02:30,194 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:02:30,195 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"sai\" + 0.009*\"bahá\"\n", + "2019-01-31 01:02:30,201 : INFO : topic diff=0.004646, rho=0.027227\n", + "2019-01-31 01:02:32,913 : INFO : -11.879 per-word bound, 3765.6 perplexity estimate based on a held-out corpus of 2000 documents with 556707 words\n", + "2019-01-31 01:02:32,913 : INFO : PROGRESS: pass 0, at document #2700000/4922894\n", + "2019-01-31 01:02:34,307 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:34,573 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:02:34,575 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"bank\" + 0.012*\"busi\" + 0.011*\"million\" + 0.011*\"market\" + 0.010*\"produc\" + 
0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:02:34,576 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"spectacl\" + 0.006*\"produc\"\n", + "2019-01-31 01:02:34,577 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.012*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\" + 0.009*\"dai\"\n", + "2019-01-31 01:02:34,578 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.025*\"nation\" + 0.022*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:02:34,584 : INFO : topic diff=0.004004, rho=0.027217\n", + "2019-01-31 01:02:34,739 : INFO : PROGRESS: pass 0, at document #2702000/4922894\n", + "2019-01-31 01:02:36,118 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:36,385 : INFO : topic #5 (0.020): 0.040*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:02:36,386 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.079*\"sens\" + 0.079*\"octob\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.072*\"notion\" + 0.070*\"judici\" + 0.070*\"august\" + 0.069*\"april\" + 0.068*\"decatur\"\n", + "2019-01-31 01:02:36,387 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.027*\"champion\" + 0.027*\"alic\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:02:36,388 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.012*\"plaisir\" + 0.011*\"feel\" + 0.010*\"genu\" + 0.010*\"male\" + 0.009*\"adulthood\" + 
0.008*\"median\" + 0.008*\"western\" + 0.007*\"biom\"\n", + "2019-01-31 01:02:36,389 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:02:36,395 : INFO : topic diff=0.003907, rho=0.027206\n", + "2019-01-31 01:02:36,548 : INFO : PROGRESS: pass 0, at document #2704000/4922894\n", + "2019-01-31 01:02:37,895 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:38,162 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.045*\"canadian\" + 0.025*\"hoar\" + 0.021*\"toronto\" + 0.021*\"ontario\" + 0.015*\"novotná\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:02:38,163 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.027*\"champion\" + 0.027*\"alic\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:02:38,164 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.015*\"stop\" + 0.015*\"damag\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.011*\"danish\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:02:38,165 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.065*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"noll\" + 0.022*\"japanes\" + 0.020*\"women\" + 0.020*\"festiv\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:02:38,166 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:02:38,171 : INFO : topic diff=0.004478, rho=0.027196\n", + "2019-01-31 01:02:38,326 : INFO : 
PROGRESS: pass 0, at document #2706000/4922894\n", + "2019-01-31 01:02:39,694 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:39,960 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.027*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:02:39,961 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:02:39,962 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.025*\"new\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:02:39,963 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"vacant\"\n", + "2019-01-31 01:02:39,964 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:02:39,970 : INFO : topic diff=0.003706, rho=0.027186\n", + "2019-01-31 01:02:40,123 : INFO : PROGRESS: pass 0, at document #2708000/4922894\n", + "2019-01-31 01:02:41,479 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:41,746 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:02:41,747 : INFO : topic #19 (0.020): 0.015*\"centuri\" + 0.015*\"languag\" + 
0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.009*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:02:41,748 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 01:02:41,749 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.045*\"canadian\" + 0.025*\"hoar\" + 0.021*\"toronto\" + 0.021*\"ontario\" + 0.016*\"novotná\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:02:41,750 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.027*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"strategist\" + 0.011*\"constitut\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:02:41,756 : INFO : topic diff=0.003404, rho=0.027176\n", + "2019-01-31 01:02:41,910 : INFO : PROGRESS: pass 0, at document #2710000/4922894\n", + "2019-01-31 01:02:43,276 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:43,543 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.023*\"kong\" + 0.023*\"korea\" + 0.023*\"hong\" + 0.018*\"korean\" + 0.015*\"sourc\" + 0.015*\"leah\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:02:43,544 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"israel\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:43,545 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.011*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:02:43,546 : INFO : topic #8 (0.020): 0.027*\"law\" + 
0.024*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.013*\"case\" + 0.013*\"ricardo\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"rudolf\"\n", + "2019-01-31 01:02:43,547 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.028*\"champion\" + 0.026*\"men\" + 0.025*\"alic\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:02:43,553 : INFO : topic diff=0.004612, rho=0.027166\n", + "2019-01-31 01:02:43,702 : INFO : PROGRESS: pass 0, at document #2712000/4922894\n", + "2019-01-31 01:02:45,030 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:45,296 : INFO : topic #19 (0.020): 0.015*\"centuri\" + 0.014*\"languag\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.009*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:02:45,297 : INFO : topic #32 (0.020): 0.047*\"district\" + 0.043*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.023*\"area\" + 0.023*\"multitud\" + 0.021*\"citi\" + 0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:02:45,298 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"sai\"\n", + "2019-01-31 01:02:45,299 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"taxpay\" + 0.012*\"winner\"\n", + "2019-01-31 01:02:45,300 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"woman\" + 0.027*\"champion\" + 0.025*\"men\" + 0.025*\"alic\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:02:45,306 : INFO : topic diff=0.004241, rho=0.027156\n", + "2019-01-31 
01:02:45,463 : INFO : PROGRESS: pass 0, at document #2714000/4922894\n", + "2019-01-31 01:02:46,851 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:47,117 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.013*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"rudolf\"\n", + "2019-01-31 01:02:47,118 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.019*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:02:47,119 : INFO : topic #48 (0.020): 0.086*\"march\" + 0.079*\"sens\" + 0.078*\"octob\" + 0.073*\"januari\" + 0.072*\"juli\" + 0.071*\"notion\" + 0.070*\"judici\" + 0.070*\"august\" + 0.069*\"april\" + 0.067*\"decatur\"\n", + "2019-01-31 01:02:47,120 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.027*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:02:47,121 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.038*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 01:02:47,127 : INFO : topic diff=0.004319, rho=0.027146\n", + "2019-01-31 01:02:47,283 : INFO : PROGRESS: pass 0, at document #2716000/4922894\n", + "2019-01-31 01:02:48,660 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:48,926 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:02:48,927 : INFO : topic #40 (0.020): 
0.087*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:02:48,928 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:02:48,929 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"storag\"\n", + "2019-01-31 01:02:48,930 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.070*\"notion\" + 0.070*\"judici\" + 0.069*\"august\" + 0.068*\"april\" + 0.067*\"decatur\"\n", + "2019-01-31 01:02:48,936 : INFO : topic diff=0.004555, rho=0.027136\n", + "2019-01-31 01:02:49,095 : INFO : PROGRESS: pass 0, at document #2718000/4922894\n", + "2019-01-31 01:02:50,489 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:50,756 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.027*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:02:50,757 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\" + 0.009*\"hot\"\n", + "2019-01-31 01:02:50,758 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"produc\" + 
0.006*\"develop\"\n", + "2019-01-31 01:02:50,759 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:02:50,760 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.021*\"taxpay\" + 0.014*\"ret\" + 0.014*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:02:50,766 : INFO : topic diff=0.004202, rho=0.027126\n", + "2019-01-31 01:02:53,395 : INFO : -11.589 per-word bound, 3080.4 perplexity estimate based on a held-out corpus of 2000 documents with 510275 words\n", + "2019-01-31 01:02:53,396 : INFO : PROGRESS: pass 0, at document #2720000/4922894\n", + "2019-01-31 01:02:54,727 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:54,993 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 01:02:54,994 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:02:54,995 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.036*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 01:02:54,996 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.013*\"israel\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:54,997 : INFO : topic #16 (0.020): 0.054*\"king\" 
+ 0.031*\"priest\" + 0.022*\"duke\" + 0.019*\"grammat\" + 0.019*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.018*\"quarterli\" + 0.013*\"brazil\" + 0.012*\"kingdom\" + 0.012*\"maria\"\n", + "2019-01-31 01:02:55,003 : INFO : topic diff=0.004335, rho=0.027116\n", + "2019-01-31 01:02:55,161 : INFO : PROGRESS: pass 0, at document #2722000/4922894\n", + "2019-01-31 01:02:56,546 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:56,814 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.018*\"english\" + 0.017*\"polit\" + 0.013*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:02:56,815 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"london\" + 0.024*\"new\" + 0.022*\"england\" + 0.022*\"australian\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:02:56,816 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.013*\"israel\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:02:56,817 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.023*\"personifi\" + 0.022*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 01:02:56,818 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.045*\"line\" + 0.033*\"raid\" + 0.027*\"arsen\" + 0.023*\"museo\" + 0.019*\"traceabl\" + 0.019*\"rosenwald\" + 0.019*\"serv\" + 0.012*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:02:56,824 : INFO : topic diff=0.003329, rho=0.027106\n", + "2019-01-31 01:02:56,981 : INFO : PROGRESS: pass 0, at document #2724000/4922894\n", + "2019-01-31 01:02:58,357 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:02:58,625 : 
INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.032*\"rural\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 01:02:58,626 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:02:58,627 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:02:58,628 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:02:58,629 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.053*\"parti\" + 0.023*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.015*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:02:58,635 : INFO : topic diff=0.004157, rho=0.027096\n", + "2019-01-31 01:02:58,801 : INFO : PROGRESS: pass 0, at document #2726000/4922894\n", + "2019-01-31 01:03:00,222 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:00,488 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wreath\"\n", + "2019-01-31 01:03:00,489 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"wind\" + 0.017*\"norwai\" + 0.015*\"stop\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.012*\"danish\" + 0.012*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:03:00,490 : INFO : topic #17 
(0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.013*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"relationship\"\n", + "2019-01-31 01:03:00,491 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:03:00,492 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:03:00,498 : INFO : topic diff=0.004914, rho=0.027086\n", + "2019-01-31 01:03:00,657 : INFO : PROGRESS: pass 0, at document #2728000/4922894\n", + "2019-01-31 01:03:02,046 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:02,312 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:03:02,313 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.057*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.022*\"member\" + 0.015*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"liber\" + 0.013*\"report\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:03:02,314 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.013*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"relationship\"\n", + "2019-01-31 01:03:02,315 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 
0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:03:02,316 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:03:02,322 : INFO : topic diff=0.004180, rho=0.027077\n", + "2019-01-31 01:03:02,479 : INFO : PROGRESS: pass 0, at document #2730000/4922894\n", + "2019-01-31 01:03:03,841 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:04,108 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\" + 0.009*\"dai\"\n", + "2019-01-31 01:03:04,109 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:03:04,111 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:03:04,112 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.023*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:03:04,113 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 01:03:04,119 : INFO : topic diff=0.004918, rho=0.027067\n", + "2019-01-31 01:03:04,277 : INFO : PROGRESS: pass 0, at document #2732000/4922894\n", + "2019-01-31 01:03:05,669 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:03:05,935 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 01:03:05,936 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"octob\" + 0.078*\"sens\" + 0.071*\"juli\" + 0.071*\"januari\" + 0.070*\"notion\" + 0.069*\"august\" + 0.068*\"judici\" + 0.068*\"decatur\" + 0.067*\"april\"\n", + "2019-01-31 01:03:05,937 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"isra\"\n", + "2019-01-31 01:03:05,939 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"yard\"\n", + "2019-01-31 01:03:05,940 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:03:05,945 : INFO : topic diff=0.004245, rho=0.027057\n", + "2019-01-31 01:03:06,099 : INFO : PROGRESS: pass 0, at document #2734000/4922894\n", + "2019-01-31 01:03:07,450 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:07,717 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"cultur\" + 0.006*\"woman\"\n", + "2019-01-31 01:03:07,719 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 
0.011*\"author\"\n", + "2019-01-31 01:03:07,720 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"yard\"\n", + "2019-01-31 01:03:07,721 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:03:07,722 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.013*\"plaisir\" + 0.011*\"genu\" + 0.011*\"feel\" + 0.010*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"adulthood\" + 0.008*\"biom\"\n", + "2019-01-31 01:03:07,728 : INFO : topic diff=0.004264, rho=0.027047\n", + "2019-01-31 01:03:07,883 : INFO : PROGRESS: pass 0, at document #2736000/4922894\n", + "2019-01-31 01:03:09,265 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:09,532 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.012*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 01:03:09,533 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.031*\"rural\" + 0.027*\"poison\" + 0.023*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 01:03:09,534 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:03:09,535 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 
0.006*\"vision\"\n", + "2019-01-31 01:03:09,536 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:03:09,542 : INFO : topic diff=0.004053, rho=0.027037\n", + "2019-01-31 01:03:09,700 : INFO : PROGRESS: pass 0, at document #2738000/4922894\n", + "2019-01-31 01:03:11,093 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:11,360 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.013*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:03:11,361 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:03:11,362 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.044*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:03:11,363 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.023*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 01:03:11,364 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"isra\"\n", + "2019-01-31 01:03:11,370 : INFO : topic diff=0.003620, rho=0.027027\n", + "2019-01-31 01:03:14,068 : INFO : -11.721 per-word bound, 3375.2 perplexity estimate based on a held-out corpus of 2000 documents with 
540851 words\n", + "2019-01-31 01:03:14,068 : INFO : PROGRESS: pass 0, at document #2740000/4922894\n", + "2019-01-31 01:03:15,450 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:15,716 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.008*\"wreath\"\n", + "2019-01-31 01:03:15,717 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.044*\"line\" + 0.032*\"raid\" + 0.026*\"arsen\" + 0.023*\"museo\" + 0.020*\"rosenwald\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.013*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:03:15,718 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.024*\"new\" + 0.024*\"london\" + 0.022*\"australian\" + 0.022*\"england\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.014*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:03:15,719 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.071*\"juli\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.069*\"august\" + 0.068*\"judici\" + 0.068*\"decatur\" + 0.067*\"april\"\n", + "2019-01-31 01:03:15,720 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:03:15,726 : INFO : topic diff=0.004130, rho=0.027017\n", + "2019-01-31 01:03:15,888 : INFO : PROGRESS: pass 0, at document #2742000/4922894\n", + "2019-01-31 01:03:17,297 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:17,562 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 
0.011*\"lizard\"\n", + "2019-01-31 01:03:17,564 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:03:17,565 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"love\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:03:17,566 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"nicola\" + 0.011*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 01:03:17,567 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.045*\"canadian\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.021*\"toronto\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:03:17,573 : INFO : topic diff=0.005132, rho=0.027007\n", + "2019-01-31 01:03:17,728 : INFO : PROGRESS: pass 0, at document #2744000/4922894\n", + "2019-01-31 01:03:19,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:19,355 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.013*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:03:19,356 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 01:03:19,357 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 
0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:03:19,358 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:03:19,359 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:03:19,365 : INFO : topic diff=0.004357, rho=0.026997\n", + "2019-01-31 01:03:19,524 : INFO : PROGRESS: pass 0, at document #2746000/4922894\n", + "2019-01-31 01:03:21,267 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:21,534 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.013*\"centuri\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"relationship\"\n", + "2019-01-31 01:03:21,535 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.007*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:03:21,536 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:03:21,537 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 01:03:21,538 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 
0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:03:21,544 : INFO : topic diff=0.004067, rho=0.026988\n", + "2019-01-31 01:03:21,703 : INFO : PROGRESS: pass 0, at document #2748000/4922894\n", + "2019-01-31 01:03:23,091 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:23,357 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:03:23,359 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:03:23,359 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.038*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:03:23,361 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.012*\"centuri\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"relationship\"\n", + "2019-01-31 01:03:23,362 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"cultur\"\n", + "2019-01-31 01:03:23,367 : INFO : topic diff=0.004250, rho=0.026978\n", + "2019-01-31 01:03:23,583 : INFO : PROGRESS: pass 0, at document #2750000/4922894\n", + "2019-01-31 01:03:24,968 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:25,234 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 
0.013*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"isra\"\n", + "2019-01-31 01:03:25,235 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.032*\"raid\" + 0.026*\"arsen\" + 0.023*\"museo\" + 0.020*\"rosenwald\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:03:25,236 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.011*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:03:25,238 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:03:25,239 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 01:03:25,245 : INFO : topic diff=0.003930, rho=0.026968\n", + "2019-01-31 01:03:25,404 : INFO : PROGRESS: pass 0, at document #2752000/4922894\n", + "2019-01-31 01:03:26,789 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:27,056 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.021*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.017*\"gener\" + 0.016*\"start\" + 0.014*\"seri\"\n", + "2019-01-31 01:03:27,057 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 01:03:27,058 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 
0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:03:27,059 : INFO : topic #9 (0.020): 0.065*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.019*\"player\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:03:27,060 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.038*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 01:03:27,066 : INFO : topic diff=0.003851, rho=0.026958\n", + "2019-01-31 01:03:27,223 : INFO : PROGRESS: pass 0, at document #2754000/4922894\n", + "2019-01-31 01:03:28,593 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:28,860 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"method\" + 0.006*\"theoret\"\n", + "2019-01-31 01:03:28,861 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"sweden\" + 0.015*\"norwai\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.012*\"danish\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:03:28,862 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"cultur\"\n", + "2019-01-31 01:03:28,863 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.045*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:03:28,864 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"colder\" + 
0.015*\"black\" + 0.014*\"western\" + 0.012*\"pain\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:03:28,870 : INFO : topic diff=0.005384, rho=0.026948\n", + "2019-01-31 01:03:29,027 : INFO : PROGRESS: pass 0, at document #2756000/4922894\n", + "2019-01-31 01:03:30,422 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:30,688 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:03:30,689 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.023*\"member\" + 0.016*\"liber\" + 0.015*\"polici\" + 0.015*\"republ\" + 0.013*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 01:03:30,690 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.022*\"factor\" + 0.013*\"plaisir\" + 0.011*\"feel\" + 0.011*\"genu\" + 0.010*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"biom\" + 0.007*\"incom\"\n", + "2019-01-31 01:03:30,691 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.012*\"denmark\" + 0.012*\"danish\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:03:30,692 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.009*\"elabor\" + 0.007*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:03:30,698 : INFO : topic diff=0.003998, rho=0.026939\n", + "2019-01-31 01:03:30,852 : INFO : PROGRESS: pass 0, at document #2758000/4922894\n", + "2019-01-31 01:03:32,211 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:32,478 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 
0.026*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:03:32,479 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"championship\"\n", + "2019-01-31 01:03:32,480 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"linear\" + 0.011*\"strategist\" + 0.010*\"depress\"\n", + "2019-01-31 01:03:32,481 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.048*\"american\" + 0.026*\"valour\" + 0.018*\"english\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"poch\" + 0.012*\"simpler\"\n", + "2019-01-31 01:03:32,482 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.036*\"cotton\" + 0.035*\"tortur\" + 0.024*\"area\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:03:32,488 : INFO : topic diff=0.003665, rho=0.026929\n", + "2019-01-31 01:03:35,176 : INFO : -12.105 per-word bound, 4403.9 perplexity estimate based on a held-out corpus of 2000 documents with 559641 words\n", + "2019-01-31 01:03:35,177 : INFO : PROGRESS: pass 0, at document #2760000/4922894\n", + "2019-01-31 01:03:36,562 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:36,828 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.021*\"factor\" + 0.013*\"plaisir\" + 0.011*\"feel\" + 0.011*\"genu\" + 0.010*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"biom\" + 0.007*\"incom\"\n", + "2019-01-31 01:03:36,829 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.020*\"del\" + 0.018*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 
0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:03:36,831 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"bank\" + 0.011*\"market\" + 0.011*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:03:36,831 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:03:36,833 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:03:36,838 : INFO : topic diff=0.004872, rho=0.026919\n", + "2019-01-31 01:03:36,998 : INFO : PROGRESS: pass 0, at document #2762000/4922894\n", + "2019-01-31 01:03:38,395 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:38,661 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.015*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:03:38,662 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:03:38,664 : INFO : topic #45 (0.020): 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"pain\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:03:38,665 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.036*\"cotton\" + 0.035*\"tortur\" + 0.024*\"area\" + 0.021*\"multitud\" + 
0.021*\"citi\" + 0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:03:38,666 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.010*\"author\"\n", + "2019-01-31 01:03:38,671 : INFO : topic diff=0.004664, rho=0.026909\n", + "2019-01-31 01:03:38,827 : INFO : PROGRESS: pass 0, at document #2764000/4922894\n", + "2019-01-31 01:03:40,214 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:40,480 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"tajikistan\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"sri\"\n", + "2019-01-31 01:03:40,481 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:03:40,482 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:03:40,483 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:03:40,484 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"taxpay\" + 0.013*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 01:03:40,490 : INFO : topic diff=0.004126, rho=0.026900\n", + "2019-01-31 01:03:40,645 : INFO : PROGRESS: pass 0, at 
document #2766000/4922894\n", + "2019-01-31 01:03:42,012 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:42,279 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:03:42,280 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.036*\"cotton\" + 0.035*\"tortur\" + 0.024*\"area\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:03:42,281 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:03:42,282 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"men\" + 0.024*\"olymp\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:03:42,283 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.011*\"televis\" + 0.010*\"tajikistan\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:03:42,289 : INFO : topic diff=0.003602, rho=0.026890\n", + "2019-01-31 01:03:42,443 : INFO : PROGRESS: pass 0, at document #2768000/4922894\n", + "2019-01-31 01:03:43,825 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:44,091 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:03:44,093 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 
0.015*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.010*\"author\"\n", + "2019-01-31 01:03:44,094 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:03:44,095 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.025*\"palmer\" + 0.022*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:03:44,096 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.012*\"centuri\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:03:44,102 : INFO : topic diff=0.003832, rho=0.026880\n", + "2019-01-31 01:03:44,253 : INFO : PROGRESS: pass 0, at document #2770000/4922894\n", + "2019-01-31 01:03:45,590 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:45,856 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:03:45,857 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.025*\"personifi\" + 0.023*\"moscow\" + 0.023*\"reprint\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:03:45,858 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"storag\"\n", + "2019-01-31 01:03:45,859 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.024*\"schuster\" + 0.023*\"institut\" + 
0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:03:45,860 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.080*\"octob\" + 0.079*\"sens\" + 0.071*\"juli\" + 0.071*\"januari\" + 0.071*\"august\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.068*\"decatur\" + 0.068*\"april\"\n", + "2019-01-31 01:03:45,866 : INFO : topic diff=0.004574, rho=0.026870\n", + "2019-01-31 01:03:46,026 : INFO : PROGRESS: pass 0, at document #2772000/4922894\n", + "2019-01-31 01:03:47,429 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:47,695 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:03:47,696 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.010*\"elabor\" + 0.010*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:03:47,697 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.032*\"raid\" + 0.025*\"arsen\" + 0.023*\"museo\" + 0.021*\"rosenwald\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.011*\"exhaust\"\n", + "2019-01-31 01:03:47,698 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 01:03:47,700 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"palmer\" + 0.022*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:03:47,705 : INFO : topic diff=0.004350, rho=0.026861\n", + "2019-01-31 01:03:47,861 : INFO : PROGRESS: pass 0, 
at document #2774000/4922894\n", + "2019-01-31 01:03:49,243 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:49,509 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.023*\"moscow\" + 0.023*\"reprint\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 01:03:49,510 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"colder\" + 0.015*\"black\" + 0.014*\"western\" + 0.012*\"pain\" + 0.012*\"record\" + 0.010*\"blind\" + 0.009*\"depress\"\n", + "2019-01-31 01:03:49,511 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:03:49,513 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:03:49,514 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.022*\"toronto\" + 0.021*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:03:49,520 : INFO : topic diff=0.003771, rho=0.026851\n", + "2019-01-31 01:03:49,671 : INFO : PROGRESS: pass 0, at document #2776000/4922894\n", + "2019-01-31 01:03:51,045 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:51,311 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:03:51,312 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.031*\"priest\" + 
0.023*\"duke\" + 0.021*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.012*\"kingdom\" + 0.012*\"brazil\" + 0.012*\"count\"\n", + "2019-01-31 01:03:51,313 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"lizard\" + 0.011*\"carlo\" + 0.011*\"juan\"\n", + "2019-01-31 01:03:51,314 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.021*\"factor\" + 0.013*\"plaisir\" + 0.011*\"genu\" + 0.010*\"feel\" + 0.009*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"biom\" + 0.007*\"incom\"\n", + "2019-01-31 01:03:51,315 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.014*\"presid\" + 0.012*\"collect\" + 0.012*\"storag\" + 0.011*\"nicola\" + 0.010*\"author\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:03:51,321 : INFO : topic diff=0.003960, rho=0.026841\n", + "2019-01-31 01:03:51,479 : INFO : PROGRESS: pass 0, at document #2778000/4922894\n", + "2019-01-31 01:03:52,981 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:53,246 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:03:53,248 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:03:53,249 : INFO : topic #46 (0.020): 0.019*\"norwai\" + 0.017*\"sweden\" + 0.016*\"stop\" + 0.016*\"wind\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.012*\"danish\" + 0.012*\"denmark\" + 0.010*\"huntsvil\"\n", + "2019-01-31 01:03:53,250 : INFO 
: topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"lizard\" + 0.011*\"carlo\" + 0.011*\"juan\"\n", + "2019-01-31 01:03:53,251 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"servitud\" + 0.006*\"poet\" + 0.006*\"measur\"\n", + "2019-01-31 01:03:53,257 : INFO : topic diff=0.004358, rho=0.026832\n", + "2019-01-31 01:03:55,893 : INFO : -11.579 per-word bound, 3060.1 perplexity estimate based on a held-out corpus of 2000 documents with 531217 words\n", + "2019-01-31 01:03:55,893 : INFO : PROGRESS: pass 0, at document #2780000/4922894\n", + "2019-01-31 01:03:57,259 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:57,525 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"winner\"\n", + "2019-01-31 01:03:57,526 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.021*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 01:03:57,527 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.031*\"priest\" + 0.023*\"duke\" + 0.021*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.012*\"brazil\" + 0.012*\"kingdom\" + 0.012*\"count\"\n", + "2019-01-31 01:03:57,529 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"spectacl\" + 0.006*\"develop\" + 0.006*\"encyclopedia\"\n", + "2019-01-31 01:03:57,530 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.033*\"incumb\" + 
0.014*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.010*\"affection\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:03:57,535 : INFO : topic diff=0.003553, rho=0.026822\n", + "2019-01-31 01:03:57,749 : INFO : PROGRESS: pass 0, at document #2782000/4922894\n", + "2019-01-31 01:03:59,140 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:03:59,406 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:03:59,408 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:03:59,409 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.031*\"priest\" + 0.023*\"duke\" + 0.021*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.012*\"brazil\" + 0.012*\"kingdom\" + 0.012*\"portugues\"\n", + "2019-01-31 01:03:59,410 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:03:59,411 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.022*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:03:59,417 : INFO : topic diff=0.004201, rho=0.026812\n", + "2019-01-31 01:03:59,576 : INFO : PROGRESS: pass 0, at document #2784000/4922894\n", + "2019-01-31 01:04:00,967 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:01,234 : INFO : topic #0 
(0.020): 0.067*\"statewid\" + 0.044*\"line\" + 0.034*\"raid\" + 0.024*\"arsen\" + 0.023*\"museo\" + 0.020*\"rosenwald\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.011*\"exhaust\"\n", + "2019-01-31 01:04:01,235 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"winner\"\n", + "2019-01-31 01:04:01,236 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 01:04:01,237 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.023*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"new\" + 0.015*\"novotná\" + 0.014*\"hydrogen\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:04:01,238 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:04:01,244 : INFO : topic diff=0.004013, rho=0.026803\n", + "2019-01-31 01:04:01,403 : INFO : PROGRESS: pass 0, at document #2786000/4922894\n", + "2019-01-31 01:04:02,795 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:03,061 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.017*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:04:03,063 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"hormon\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:04:03,065 : INFO : topic 
#15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:04:03,066 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:04:03,067 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"spectacl\" + 0.006*\"encyclopedia\" + 0.006*\"produc\"\n", + "2019-01-31 01:04:03,073 : INFO : topic diff=0.004963, rho=0.026793\n", + "2019-01-31 01:04:03,224 : INFO : PROGRESS: pass 0, at document #2788000/4922894\n", + "2019-01-31 01:04:04,694 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:04,960 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:04:04,962 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:04:04,963 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.030*\"priest\" + 0.023*\"duke\" + 0.020*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.013*\"brazil\" + 0.012*\"kingdom\" + 0.012*\"portugues\"\n", + "2019-01-31 01:04:04,964 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.011*\"strategist\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 
01:04:04,965 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.010*\"author\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:04:04,971 : INFO : topic diff=0.003588, rho=0.026784\n", + "2019-01-31 01:04:05,129 : INFO : PROGRESS: pass 0, at document #2790000/4922894\n", + "2019-01-31 01:04:06,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:06,800 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:04:06,801 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:04:06,802 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:04:06,803 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:04:06,804 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.026*\"australia\" + 0.024*\"new\" + 0.024*\"london\" + 0.022*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:04:06,810 : INFO : topic diff=0.004202, rho=0.026774\n", + "2019-01-31 01:04:06,969 : INFO : PROGRESS: pass 0, at document #2792000/4922894\n", + "2019-01-31 01:04:08,367 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:08,634 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.017*\"stop\" + 0.017*\"sweden\" + 0.015*\"wind\" + 0.015*\"damag\" + 0.014*\"swedish\" + 0.014*\"norwegian\" + 0.012*\"denmark\" + 0.011*\"farid\" + 0.011*\"danish\"\n", + "2019-01-31 01:04:08,635 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.021*\"factor\" + 0.013*\"plaisir\" + 0.011*\"genu\" + 0.010*\"feel\" + 0.009*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.007*\"biom\" + 0.007*\"incom\"\n", + "2019-01-31 01:04:08,636 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.017*\"new\" + 0.015*\"novotná\" + 0.015*\"misericordia\" + 0.014*\"hydrogen\" + 0.013*\"quebec\"\n", + "2019-01-31 01:04:08,637 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.012*\"market\" + 0.011*\"million\" + 0.011*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:04:08,638 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.012*\"centuri\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:04:08,644 : INFO : topic diff=0.003997, rho=0.026764\n", + "2019-01-31 01:04:08,806 : INFO : PROGRESS: pass 0, at document #2794000/4922894\n", + "2019-01-31 01:04:10,233 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:10,499 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.021*\"factor\" + 0.013*\"plaisir\" + 0.011*\"genu\" + 0.010*\"feel\" + 0.009*\"male\" + 0.008*\"western\" + 0.008*\"median\" + 0.007*\"biom\" + 0.007*\"incom\"\n", + "2019-01-31 01:04:10,500 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.056*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.022*\"member\" + 0.016*\"polici\" + 
0.015*\"republ\" + 0.014*\"liber\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:04:10,501 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:04:10,502 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.030*\"priest\" + 0.022*\"duke\" + 0.021*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.013*\"portugues\" + 0.012*\"brazil\" + 0.012*\"kingdom\"\n", + "2019-01-31 01:04:10,503 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"storag\"\n", + "2019-01-31 01:04:10,509 : INFO : topic diff=0.004727, rho=0.026755\n", + "2019-01-31 01:04:10,668 : INFO : PROGRESS: pass 0, at document #2796000/4922894\n", + "2019-01-31 01:04:12,083 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:12,349 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.074*\"januari\" + 0.072*\"juli\" + 0.070*\"august\" + 0.070*\"notion\" + 0.070*\"judici\" + 0.069*\"april\" + 0.068*\"decatur\"\n", + "2019-01-31 01:04:12,350 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:04:12,351 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:04:12,352 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 
0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:04:12,353 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:04:12,359 : INFO : topic diff=0.004487, rho=0.026745\n", + "2019-01-31 01:04:12,518 : INFO : PROGRESS: pass 0, at document #2798000/4922894\n", + "2019-01-31 01:04:13,909 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:14,176 : INFO : topic #35 (0.020): 0.063*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"personifi\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 01:04:14,177 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.007*\"diggin\" + 0.007*\"championship\"\n", + "2019-01-31 01:04:14,178 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.012*\"centuri\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:04:14,179 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.046*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:04:14,180 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.074*\"januari\" + 0.072*\"juli\" + 0.070*\"august\" + 0.070*\"notion\" + 0.070*\"judici\" + 0.068*\"april\" + 0.068*\"decatur\"\n", + "2019-01-31 01:04:14,186 : INFO : topic diff=0.003417, rho=0.026736\n", + "2019-01-31 01:04:16,870 : INFO : -11.760 per-word bound, 3467.9 perplexity 
estimate based on a held-out corpus of 2000 documents with 547626 words\n", + "2019-01-31 01:04:16,870 : INFO : PROGRESS: pass 0, at document #2800000/4922894\n", + "2019-01-31 01:04:18,251 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:18,518 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.007*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:04:18,519 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"produc\" + 0.011*\"direct\"\n", + "2019-01-31 01:04:18,520 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.022*\"hoar\" + 0.022*\"toronto\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.014*\"novotná\" + 0.014*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:04:18,521 : INFO : topic #35 (0.020): 0.063*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"personifi\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 01:04:18,522 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:04:18,528 : INFO : topic diff=0.003759, rho=0.026726\n", + "2019-01-31 01:04:18,690 : INFO : PROGRESS: pass 0, at document #2802000/4922894\n", + "2019-01-31 01:04:20,108 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:20,375 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 
0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 01:04:20,376 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:04:20,377 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"storag\"\n", + "2019-01-31 01:04:20,379 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:04:20,380 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"method\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"measur\"\n", + "2019-01-31 01:04:20,385 : INFO : topic diff=0.004402, rho=0.026717\n", + "2019-01-31 01:04:20,540 : INFO : PROGRESS: pass 0, at document #2804000/4922894\n", + "2019-01-31 01:04:21,910 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:22,176 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:04:22,177 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.008*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"cultur\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:04:22,178 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.020*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 
0.011*\"constitut\" + 0.011*\"strategist\" + 0.011*\"depress\" + 0.010*\"silicon\"\n", + "2019-01-31 01:04:22,179 : INFO : topic #12 (0.020): 0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"method\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"servitud\"\n", + "2019-01-31 01:04:22,180 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.011*\"sri\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"tajikistan\" + 0.010*\"singh\"\n", + "2019-01-31 01:04:22,186 : INFO : topic diff=0.003843, rho=0.026707\n", + "2019-01-31 01:04:22,341 : INFO : PROGRESS: pass 0, at document #2806000/4922894\n", + "2019-01-31 01:04:23,723 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:23,989 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:04:23,990 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.021*\"factor\" + 0.013*\"plaisir\" + 0.011*\"genu\" + 0.010*\"feel\" + 0.009*\"male\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"incom\" + 0.008*\"biom\"\n", + "2019-01-31 01:04:23,991 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:04:23,992 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"sri\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"tajikistan\" + 0.010*\"singh\"\n", + "2019-01-31 01:04:23,993 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 
0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:04:23,999 : INFO : topic diff=0.003960, rho=0.026698\n", + "2019-01-31 01:04:24,155 : INFO : PROGRESS: pass 0, at document #2808000/4922894\n", + "2019-01-31 01:04:25,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:25,809 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.011*\"produc\"\n", + "2019-01-31 01:04:25,810 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.074*\"januari\" + 0.072*\"juli\" + 0.070*\"august\" + 0.069*\"notion\" + 0.069*\"judici\" + 0.069*\"april\" + 0.068*\"decatur\"\n", + "2019-01-31 01:04:25,811 : INFO : topic #20 (0.020): 0.139*\"scholar\" + 0.038*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"gothic\" + 0.011*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:04:25,812 : INFO : topic #27 (0.020): 0.068*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.017*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:04:25,813 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 01:04:25,819 : INFO : topic diff=0.004372, rho=0.026688\n", + "2019-01-31 01:04:25,976 : INFO : PROGRESS: pass 0, at document #2810000/4922894\n", + "2019-01-31 01:04:27,364 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:27,630 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 
0.024*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:04:27,631 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:04:27,632 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.022*\"duke\" + 0.020*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"count\" + 0.013*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:04:27,633 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:04:27,634 : INFO : topic #35 (0.020): 0.060*\"russia\" + 0.039*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"personifi\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.021*\"moscow\" + 0.019*\"alexand\" + 0.017*\"poland\" + 0.016*\"unfortun\"\n", + "2019-01-31 01:04:27,640 : INFO : topic diff=0.004003, rho=0.026679\n", + "2019-01-31 01:04:27,796 : INFO : PROGRESS: pass 0, at document #2812000/4922894\n", + "2019-01-31 01:04:29,181 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:29,447 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:04:29,448 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.024*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:04:29,449 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 
0.017*\"compos\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"jack\"\n", + "2019-01-31 01:04:29,450 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:04:29,451 : INFO : topic #38 (0.020): 0.025*\"walter\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:04:29,457 : INFO : topic diff=0.003786, rho=0.026669\n", + "2019-01-31 01:04:29,668 : INFO : PROGRESS: pass 0, at document #2814000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:04:31,053 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:31,320 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:04:31,321 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:04:31,322 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.027*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.021*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:04:31,323 : INFO : topic #38 (0.020): 0.025*\"walter\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"till\" + 0.006*\"govern\"\n", + "2019-01-31 01:04:31,324 : INFO : topic #12 (0.020): 
0.010*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\" + 0.006*\"differ\"\n", + "2019-01-31 01:04:31,330 : INFO : topic diff=0.003671, rho=0.026660\n", + "2019-01-31 01:04:31,490 : INFO : PROGRESS: pass 0, at document #2816000/4922894\n", + "2019-01-31 01:04:32,901 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:33,168 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"strategist\" + 0.010*\"linear\"\n", + "2019-01-31 01:04:33,169 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:04:33,170 : INFO : topic #46 (0.020): 0.018*\"norwai\" + 0.017*\"stop\" + 0.017*\"sweden\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.011*\"farid\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:04:33,171 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.010*\"mode\" + 0.010*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:04:33,172 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:04:33,178 : INFO : topic diff=0.005209, rho=0.026650\n", + "2019-01-31 01:04:33,337 : INFO : PROGRESS: pass 0, at document #2818000/4922894\n", + "2019-01-31 01:04:34,732 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
01:04:34,998 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"solitari\"\n", + "2019-01-31 01:04:34,999 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.005*\"storag\"\n", + "2019-01-31 01:04:35,000 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:04:35,001 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"storag\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.010*\"author\"\n", + "2019-01-31 01:04:35,002 : INFO : topic #49 (0.020): 0.046*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.011*\"sri\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:04:35,008 : INFO : topic diff=0.004168, rho=0.026641\n", + "2019-01-31 01:04:37,758 : INFO : -11.921 per-word bound, 3878.7 perplexity estimate based on a held-out corpus of 2000 documents with 562777 words\n", + "2019-01-31 01:04:37,759 : INFO : PROGRESS: pass 0, at document #2820000/4922894\n", + "2019-01-31 01:04:39,161 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:39,427 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.010*\"feel\" + 0.010*\"genu\" + 0.010*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:04:39,428 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.038*\"sovereignti\" + 0.033*\"rural\" + 
0.026*\"personifi\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.021*\"moscow\" + 0.019*\"alexand\" + 0.016*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:04:39,429 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.078*\"octob\" + 0.076*\"sens\" + 0.075*\"januari\" + 0.073*\"juli\" + 0.071*\"notion\" + 0.071*\"judici\" + 0.070*\"august\" + 0.069*\"april\" + 0.069*\"decatur\"\n", + "2019-01-31 01:04:39,430 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:04:39,431 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.011*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:04:39,437 : INFO : topic diff=0.003160, rho=0.026631\n", + "2019-01-31 01:04:39,599 : INFO : PROGRESS: pass 0, at document #2822000/4922894\n", + "2019-01-31 01:04:40,995 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:41,262 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.011*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:04:41,263 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\" + 0.013*\"taxpay\"\n", + "2019-01-31 01:04:41,265 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"market\" + 0.011*\"million\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.009*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"serv\"\n", + "2019-01-31 01:04:41,266 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.056*\"parti\" + 
0.025*\"democrat\" + 0.024*\"voluntari\" + 0.022*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:04:41,267 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:04:41,273 : INFO : topic diff=0.004925, rho=0.026622\n", + "2019-01-31 01:04:41,424 : INFO : PROGRESS: pass 0, at document #2824000/4922894\n", + "2019-01-31 01:04:42,775 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:43,041 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.021*\"duke\" + 0.020*\"idiosyncrat\" + 0.020*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + "2019-01-31 01:04:43,043 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"player\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.017*\"english\" + 0.016*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:04:43,044 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:04:43,045 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:04:43,046 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:04:43,052 : INFO : topic diff=0.004127, rho=0.026612\n", + 
"2019-01-31 01:04:43,210 : INFO : PROGRESS: pass 0, at document #2826000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:04:44,578 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:44,847 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:04:44,848 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.022*\"toronto\" + 0.016*\"hydrogen\" + 0.016*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:04:44,849 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 01:04:44,850 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"servitud\" + 0.006*\"differ\"\n", + "2019-01-31 01:04:44,851 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"dixi\"\n", + "2019-01-31 01:04:44,857 : INFO : topic diff=0.004192, rho=0.026603\n", + "2019-01-31 01:04:45,013 : INFO : PROGRESS: pass 0, at document #2828000/4922894\n", + "2019-01-31 01:04:46,390 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:46,656 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 
0.009*\"austria\"\n", + "2019-01-31 01:04:46,657 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 01:04:46,659 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.016*\"scot\" + 0.012*\"blur\" + 0.011*\"pope\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.010*\"fleet\"\n", + "2019-01-31 01:04:46,660 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.074*\"januari\" + 0.073*\"juli\" + 0.071*\"notion\" + 0.070*\"judici\" + 0.070*\"august\" + 0.069*\"decatur\" + 0.068*\"april\"\n", + "2019-01-31 01:04:46,661 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:04:46,666 : INFO : topic diff=0.004394, rho=0.026593\n", + "2019-01-31 01:04:46,822 : INFO : PROGRESS: pass 0, at document #2830000/4922894\n", + "2019-01-31 01:04:48,211 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:48,477 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.014*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:04:48,478 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:04:48,479 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.021*\"arsen\" + 0.021*\"museo\" + 0.020*\"traceabl\" + 0.020*\"rosenwald\" + 0.019*\"serv\" + 0.012*\"oper\" + 
0.011*\"exhaust\"\n", + "2019-01-31 01:04:48,480 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"mexican\"\n", + "2019-01-31 01:04:48,481 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.038*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.019*\"alexand\" + 0.017*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:04:48,487 : INFO : topic diff=0.003896, rho=0.026584\n", + "2019-01-31 01:04:48,640 : INFO : PROGRESS: pass 0, at document #2832000/4922894\n", + "2019-01-31 01:04:49,999 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:50,268 : INFO : topic #13 (0.020): 0.027*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:04:50,269 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.021*\"museo\" + 0.021*\"arsen\" + 0.020*\"traceabl\" + 0.019*\"rosenwald\" + 0.019*\"serv\" + 0.012*\"oper\" + 0.011*\"exhaust\"\n", + "2019-01-31 01:04:50,270 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.016*\"new\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:04:50,271 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"norwai\" + 0.017*\"sweden\" + 0.015*\"swedish\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.014*\"damag\" + 0.012*\"huntsvil\" + 0.011*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:04:50,272 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 
0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:04:50,278 : INFO : topic diff=0.003917, rho=0.026575\n", + "2019-01-31 01:04:50,434 : INFO : PROGRESS: pass 0, at document #2834000/4922894\n", + "2019-01-31 01:04:51,808 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:52,074 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"market\" + 0.011*\"million\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.009*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"serv\"\n", + "2019-01-31 01:04:52,075 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.023*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:04:52,076 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.022*\"alic\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 01:04:52,077 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.045*\"canadian\" + 0.023*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:04:52,078 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:04:52,084 : INFO : topic diff=0.003520, rho=0.026565\n", + "2019-01-31 01:04:52,247 : INFO : PROGRESS: pass 0, at document #2836000/4922894\n", + "2019-01-31 01:04:53,655 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:53,924 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.056*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.022*\"member\" + 0.016*\"polici\" + 
0.016*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:04:53,925 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.027*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"japanes\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.018*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:04:53,926 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:04:53,927 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:04:53,928 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.021*\"factor\" + 0.012*\"plaisir\" + 0.010*\"feel\" + 0.010*\"genu\" + 0.010*\"male\" + 0.009*\"median\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:04:53,934 : INFO : topic diff=0.003504, rho=0.026556\n", + "2019-01-31 01:04:54,087 : INFO : PROGRESS: pass 0, at document #2838000/4922894\n", + "2019-01-31 01:04:55,435 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:04:55,702 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"highli\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:04:55,703 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.043*\"chilton\" + 0.023*\"hong\" + 0.023*\"korea\" + 0.022*\"kong\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"kim\" + 0.016*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:04:55,704 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"personifi\" + 
0.025*\"poison\" + 0.024*\"reprint\" + 0.021*\"moscow\" + 0.018*\"alexand\" + 0.017*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:04:55,705 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.021*\"factor\" + 0.012*\"plaisir\" + 0.010*\"feel\" + 0.010*\"genu\" + 0.010*\"male\" + 0.009*\"median\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:04:55,706 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:04:55,712 : INFO : topic diff=0.004200, rho=0.026547\n", + "2019-01-31 01:04:58,414 : INFO : -11.467 per-word bound, 2830.7 perplexity estimate based on a held-out corpus of 2000 documents with 565743 words\n", + "2019-01-31 01:04:58,415 : INFO : PROGRESS: pass 0, at document #2840000/4922894\n", + "2019-01-31 01:04:59,795 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:00,062 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.014*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:05:00,063 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"palmer\" + 0.009*\"north\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"land\"\n", + "2019-01-31 01:05:00,064 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:05:00,066 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 
0.009*\"highli\"\n", + "2019-01-31 01:05:00,067 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:05:00,073 : INFO : topic diff=0.003749, rho=0.026537\n", + "2019-01-31 01:05:00,228 : INFO : PROGRESS: pass 0, at document #2842000/4922894\n", + "2019-01-31 01:05:01,599 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:01,866 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"reprint\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.021*\"moscow\" + 0.018*\"alexand\" + 0.018*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:05:01,867 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:05:01,868 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:05:01,869 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:05:01,870 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.016*\"new\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:05:01,877 : INFO : topic diff=0.004018, rho=0.026528\n", + "2019-01-31 01:05:02,034 : INFO : PROGRESS: pass 0, at document #2844000/4922894\n", + "2019-01-31 01:05:03,415 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:03,681 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"personifi\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.021*\"moscow\" + 0.018*\"alexand\" + 0.017*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:05:03,683 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:05:03,684 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:05:03,685 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.020*\"idiosyncrat\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + "2019-01-31 01:05:03,686 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.043*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"kim\" + 0.016*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:05:03,691 : INFO : topic diff=0.003896, rho=0.026519\n", + "2019-01-31 01:05:03,851 : INFO : PROGRESS: pass 0, at document #2846000/4922894\n", + "2019-01-31 01:05:05,240 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:05,507 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:05:05,508 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 
0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 01:05:05,509 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:05:05,510 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.010*\"bahá\"\n", + "2019-01-31 01:05:05,511 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:05:05,517 : INFO : topic diff=0.003716, rho=0.026509\n", + "2019-01-31 01:05:05,731 : INFO : PROGRESS: pass 0, at document #2848000/4922894\n", + "2019-01-31 01:05:07,083 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:07,350 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"pope\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.010*\"bahá\"\n", + "2019-01-31 01:05:07,351 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 01:05:07,352 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"australia\" + 0.024*\"new\" + 0.024*\"england\" + 0.021*\"australian\" + 0.019*\"ireland\" + 0.019*\"british\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:05:07,353 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.078*\"sens\" + 0.078*\"octob\" + 0.077*\"januari\" + 0.073*\"juli\" + 0.071*\"judici\" + 0.071*\"notion\" + 
0.070*\"august\" + 0.069*\"decatur\" + 0.069*\"april\"\n", + "2019-01-31 01:05:07,354 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.021*\"museo\" + 0.020*\"arsen\" + 0.020*\"rosenwald\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.010*\"exhaust\"\n", + "2019-01-31 01:05:07,360 : INFO : topic diff=0.004339, rho=0.026500\n", + "2019-01-31 01:05:07,514 : INFO : PROGRESS: pass 0, at document #2850000/4922894\n", + "2019-01-31 01:05:08,892 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:09,159 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"open\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:05:09,160 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:05:09,161 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 01:05:09,162 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 01:05:09,163 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.050*\"franc\" + 0.034*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wreath\"\n", + "2019-01-31 01:05:09,169 : INFO : topic diff=0.004088, rho=0.026491\n", + "2019-01-31 01:05:09,325 : INFO : PROGRESS: pass 0, at 
document #2852000/4922894\n", + "2019-01-31 01:05:10,702 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:10,969 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"depress\" + 0.010*\"linear\"\n", + "2019-01-31 01:05:10,970 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.031*\"unionist\" + 0.031*\"american\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:05:10,971 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:05:10,973 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"arsen\"\n", + "2019-01-31 01:05:10,974 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"japanes\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:05:10,979 : INFO : topic diff=0.004027, rho=0.026481\n", + "2019-01-31 01:05:11,135 : INFO : PROGRESS: pass 0, at document #2854000/4922894\n", + "2019-01-31 01:05:12,507 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:12,773 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"busi\" + 0.012*\"market\" + 0.012*\"million\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:05:12,775 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.018*\"illicit\" 
+ 0.015*\"colder\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:05:12,776 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.050*\"franc\" + 0.034*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wreath\"\n", + "2019-01-31 01:05:12,777 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"sri\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.009*\"alam\"\n", + "2019-01-31 01:05:12,778 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:05:12,784 : INFO : topic diff=0.003710, rho=0.026472\n", + "2019-01-31 01:05:12,941 : INFO : PROGRESS: pass 0, at document #2856000/4922894\n", + "2019-01-31 01:05:14,323 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:14,589 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:05:14,591 : INFO : topic #32 (0.020): 0.048*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.023*\"area\" + 0.021*\"multitud\" + 0.020*\"citi\" + 0.018*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:05:14,592 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:05:14,593 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.042*\"line\" + 0.036*\"raid\" + 0.021*\"rosenwald\" + 0.020*\"museo\" + 
0.020*\"traceabl\" + 0.020*\"arsen\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.011*\"radiu\"\n", + "2019-01-31 01:05:14,594 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.015*\"western\" + 0.014*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:05:14,600 : INFO : topic diff=0.003561, rho=0.026463\n", + "2019-01-31 01:05:14,756 : INFO : PROGRESS: pass 0, at document #2858000/4922894\n", + "2019-01-31 01:05:16,127 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:16,394 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:05:16,395 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.021*\"factor\" + 0.012*\"plaisir\" + 0.010*\"feel\" + 0.010*\"genu\" + 0.009*\"male\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:05:16,396 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.018*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:05:16,397 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.043*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.015*\"quebec\" + 0.015*\"misericordia\" + 0.014*\"novotná\"\n", + "2019-01-31 01:05:16,399 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"dixi\"\n", + "2019-01-31 01:05:16,404 : INFO : topic diff=0.003787, rho=0.026454\n", + "2019-01-31 01:05:19,124 : INFO : -11.694 per-word bound, 3312.7 perplexity estimate based on 
a held-out corpus of 2000 documents with 571272 words\n", + "2019-01-31 01:05:19,124 : INFO : PROGRESS: pass 0, at document #2860000/4922894\n", + "2019-01-31 01:05:20,519 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:20,786 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.021*\"idiosyncrat\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 01:05:20,787 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"solitari\"\n", + "2019-01-31 01:05:20,788 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.019*\"player\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:05:20,789 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"market\" + 0.012*\"million\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:05:20,790 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.022*\"hong\" + 0.022*\"korea\" + 0.022*\"kong\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.016*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:05:20,796 : INFO : topic diff=0.004324, rho=0.026444\n", + "2019-01-31 01:05:20,953 : INFO : PROGRESS: pass 0, at document #2862000/4922894\n", + "2019-01-31 01:05:22,330 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:22,596 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"denmark\" + 0.012*\"danish\" + 0.011*\"farid\"\n", 
+ "2019-01-31 01:05:22,597 : INFO : topic #48 (0.020): 0.086*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.076*\"januari\" + 0.071*\"juli\" + 0.071*\"notion\" + 0.069*\"august\" + 0.069*\"judici\" + 0.069*\"decatur\" + 0.067*\"april\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:05:22,598 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.038*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:05:22,599 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"differ\" + 0.006*\"theoret\"\n", + "2019-01-31 01:05:22,601 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"produc\"\n", + "2019-01-31 01:05:22,606 : INFO : topic diff=0.004343, rho=0.026435\n", + "2019-01-31 01:05:22,766 : INFO : PROGRESS: pass 0, at document #2864000/4922894\n", + "2019-01-31 01:05:24,151 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:24,417 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"develop\" + 0.006*\"encyclopedia\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:05:24,418 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"produc\"\n", + "2019-01-31 01:05:24,419 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 
0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"solitari\"\n", + "2019-01-31 01:05:24,421 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"arsen\"\n", + "2019-01-31 01:05:24,422 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:05:24,428 : INFO : topic diff=0.003659, rho=0.026426\n", + "2019-01-31 01:05:24,584 : INFO : PROGRESS: pass 0, at document #2866000/4922894\n", + "2019-01-31 01:05:25,955 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:26,222 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"palmer\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:05:26,223 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:05:26,224 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.011*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:05:26,225 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:05:26,227 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 
0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"solitari\"\n", + "2019-01-31 01:05:26,232 : INFO : topic diff=0.004924, rho=0.026417\n", + "2019-01-31 01:05:26,388 : INFO : PROGRESS: pass 0, at document #2868000/4922894\n", + "2019-01-31 01:05:27,774 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:28,040 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"noll\" + 0.020*\"japanes\" + 0.020*\"women\" + 0.020*\"festiv\" + 0.019*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:05:28,041 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:05:28,042 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"storag\" + 0.011*\"arsen\"\n", + "2019-01-31 01:05:28,043 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.011*\"centuri\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:05:28,044 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.042*\"line\" + 0.036*\"raid\" + 0.023*\"arsen\" + 0.021*\"rosenwald\" + 0.020*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"exhaust\"\n", + "2019-01-31 01:05:28,050 : INFO : topic diff=0.003945, rho=0.026407\n", + "2019-01-31 01:05:28,209 : INFO : PROGRESS: pass 0, at document #2870000/4922894\n", + "2019-01-31 01:05:29,610 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:29,877 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.030*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 
0.020*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:05:29,878 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 01:05:29,879 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:05:29,880 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"till\"\n", + "2019-01-31 01:05:29,881 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:05:29,887 : INFO : topic diff=0.004331, rho=0.026398\n", + "2019-01-31 01:05:30,042 : INFO : PROGRESS: pass 0, at document #2872000/4922894\n", + "2019-01-31 01:05:31,418 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:31,684 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"england\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:05:31,685 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.043*\"canadian\" + 0.023*\"hoar\" + 0.022*\"toronto\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:05:31,687 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 
0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:05:31,688 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.016*\"alexand\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:05:31,689 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.050*\"franc\" + 0.036*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:05:31,694 : INFO : topic diff=0.004138, rho=0.026389\n", + "2019-01-31 01:05:31,857 : INFO : PROGRESS: pass 0, at document #2874000/4922894\n", + "2019-01-31 01:05:33,274 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:33,541 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.015*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:05:33,542 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:05:33,543 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:05:33,544 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"love\" + 0.006*\"workplac\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:05:33,545 : INFO : topic #48 (0.020): 
0.085*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.075*\"januari\" + 0.071*\"notion\" + 0.071*\"juli\" + 0.070*\"judici\" + 0.068*\"decatur\" + 0.068*\"august\" + 0.068*\"april\"\n", + "2019-01-31 01:05:33,551 : INFO : topic diff=0.004295, rho=0.026380\n", + "2019-01-31 01:05:33,707 : INFO : PROGRESS: pass 0, at document #2876000/4922894\n", + "2019-01-31 01:05:35,093 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:35,359 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"alexand\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:05:35,360 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.021*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"feel\" + 0.009*\"male\" + 0.009*\"median\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:05:35,361 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:05:35,362 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.017*\"gener\" + 0.016*\"council\" + 0.016*\"start\"\n", + "2019-01-31 01:05:35,363 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"gestur\" + 0.006*\"love\" + 0.006*\"workplac\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:05:35,369 : INFO : topic diff=0.003851, rho=0.026371\n", + "2019-01-31 01:05:35,588 : INFO : PROGRESS: pass 0, at document #2878000/4922894\n", + "2019-01-31 01:05:37,000 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:37,267 : INFO : topic #39 
(0.020): 0.058*\"canada\" + 0.043*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:05:37,268 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.015*\"western\" + 0.015*\"black\" + 0.014*\"pain\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:05:37,269 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:05:37,270 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.022*\"arsen\" + 0.020*\"rosenwald\" + 0.020*\"museo\" + 0.020*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 01:05:37,271 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.018*\"leah\" + 0.016*\"kim\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:05:37,277 : INFO : topic diff=0.005459, rho=0.026361\n", + "2019-01-31 01:05:40,021 : INFO : -11.841 per-word bound, 3669.2 perplexity estimate based on a held-out corpus of 2000 documents with 574444 words\n", + "2019-01-31 01:05:40,022 : INFO : PROGRESS: pass 0, at document #2880000/4922894\n", + "2019-01-31 01:05:41,423 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:41,689 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:05:41,690 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.030*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 
0.021*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:05:41,691 : INFO : topic #44 (0.020): 0.028*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"open\" + 0.014*\"taxpay\" + 0.014*\"chamber\"\n", + "2019-01-31 01:05:41,692 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:05:41,693 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:05:41,699 : INFO : topic diff=0.003446, rho=0.026352\n", + "2019-01-31 01:05:41,859 : INFO : PROGRESS: pass 0, at document #2882000/4922894\n", + "2019-01-31 01:05:43,249 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:43,516 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:05:43,517 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.011*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 01:05:43,518 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.050*\"franc\" + 0.035*\"pari\" + 0.025*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:05:43,519 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.023*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 
0.015*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 01:05:43,520 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:05:43,526 : INFO : topic diff=0.004025, rho=0.026343\n", + "2019-01-31 01:05:43,683 : INFO : PROGRESS: pass 0, at document #2884000/4922894\n", + "2019-01-31 01:05:45,059 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:45,326 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.022*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:05:45,327 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.017*\"compos\" + 0.017*\"place\" + 0.014*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:05:45,328 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.021*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.017*\"gener\" + 0.016*\"council\" + 0.016*\"start\"\n", + "2019-01-31 01:05:45,329 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:05:45,330 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.022*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.014*\"report\"\n", + "2019-01-31 01:05:45,336 : INFO : topic diff=0.004115, rho=0.026334\n", + "2019-01-31 01:05:45,493 : INFO : PROGRESS: pass 0, at document #2886000/4922894\n", 
+ "2019-01-31 01:05:46,856 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:47,122 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.068*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"noll\" + 0.020*\"japanes\" + 0.020*\"festiv\" + 0.020*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:05:47,123 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:05:47,124 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:05:47,125 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.030*\"priest\" + 0.022*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.016*\"quarterli\" + 0.015*\"count\" + 0.013*\"portugues\" + 0.012*\"kingdom\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:05:47,127 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.015*\"bone\" + 0.013*\"faster\" + 0.013*\"deal\" + 0.013*\"life\" + 0.012*\"john\"\n", + "2019-01-31 01:05:47,132 : INFO : topic diff=0.003781, rho=0.026325\n", + "2019-01-31 01:05:47,286 : INFO : PROGRESS: pass 0, at document #2888000/4922894\n", + "2019-01-31 01:05:48,646 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:48,911 : INFO : topic #44 (0.020): 0.028*\"final\" + 0.028*\"rooftop\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.014*\"martin\" + 0.014*\"open\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\"\n", + "2019-01-31 01:05:48,912 : INFO : topic #12 (0.020): 0.010*\"number\" + 
0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 01:05:48,914 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.022*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:05:48,915 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"empath\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"till\"\n", + "2019-01-31 01:05:48,916 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.049*\"franc\" + 0.035*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:05:48,922 : INFO : topic diff=0.004085, rho=0.026316\n", + "2019-01-31 01:05:49,076 : INFO : PROGRESS: pass 0, at document #2890000/4922894\n", + "2019-01-31 01:05:50,422 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:50,689 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.023*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 01:05:50,691 : INFO : topic #20 (0.020): 0.147*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"start\" + 0.010*\"gothic\"\n", + "2019-01-31 01:05:50,692 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:05:50,693 : INFO : topic #46 (0.020): 0.017*\"stop\" + 
0.017*\"sweden\" + 0.016*\"damag\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"denmark\" + 0.011*\"danish\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:05:50,694 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"market\" + 0.012*\"busi\" + 0.011*\"produc\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:05:50,700 : INFO : topic diff=0.003725, rho=0.026307\n", + "2019-01-31 01:05:50,855 : INFO : PROGRESS: pass 0, at document #2892000/4922894\n", + "2019-01-31 01:05:52,245 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:52,511 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.022*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.014*\"liber\"\n", + "2019-01-31 01:05:52,512 : INFO : topic #48 (0.020): 0.083*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.075*\"januari\" + 0.070*\"juli\" + 0.069*\"notion\" + 0.068*\"judici\" + 0.067*\"august\" + 0.067*\"decatur\" + 0.066*\"april\"\n", + "2019-01-31 01:05:52,514 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:05:52,515 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.019*\"player\" + 0.019*\"folei\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:05:52,515 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:05:52,521 : INFO : topic diff=0.004450, rho=0.026298\n", + "2019-01-31 
01:05:52,678 : INFO : PROGRESS: pass 0, at document #2894000/4922894\n", + "2019-01-31 01:05:54,046 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:54,313 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.022*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.014*\"report\"\n", + "2019-01-31 01:05:54,313 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.074*\"januari\" + 0.070*\"juli\" + 0.069*\"notion\" + 0.068*\"judici\" + 0.068*\"august\" + 0.067*\"decatur\" + 0.067*\"april\"\n", + "2019-01-31 01:05:54,314 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.027*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.021*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.016*\"council\" + 0.016*\"start\"\n", + "2019-01-31 01:05:54,316 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:05:54,317 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.012*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:05:54,322 : INFO : topic diff=0.004276, rho=0.026288\n", + "2019-01-31 01:05:54,478 : INFO : PROGRESS: pass 0, at document #2896000/4922894\n", + "2019-01-31 01:05:55,855 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:56,121 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:05:56,122 : INFO : topic #35 (0.020): 0.057*\"russia\" + 
0.036*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:05:56,123 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.010*\"mode\" + 0.009*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:05:56,124 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"open\" + 0.014*\"tiepolo\" + 0.014*\"chamber\"\n", + "2019-01-31 01:05:56,126 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.022*\"arsen\" + 0.022*\"museo\" + 0.022*\"rosenwald\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 01:05:56,131 : INFO : topic diff=0.004365, rho=0.026279\n", + "2019-01-31 01:05:56,283 : INFO : PROGRESS: pass 0, at document #2898000/4922894\n", + "2019-01-31 01:05:57,629 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:05:57,896 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.041*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.023*\"korea\" + 0.019*\"leah\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:05:57,897 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:05:57,898 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"damag\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.011*\"denmark\" + 0.011*\"danish\" + 0.010*\"treeless\"\n", + "2019-01-31 01:05:57,899 : INFO : topic #27 (0.020): 
0.071*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.013*\"fool\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:05:57,900 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:05:57,906 : INFO : topic diff=0.003455, rho=0.026270\n", + "2019-01-31 01:06:00,558 : INFO : -11.614 per-word bound, 3133.7 perplexity estimate based on a held-out corpus of 2000 documents with 560306 words\n", + "2019-01-31 01:06:00,559 : INFO : PROGRESS: pass 0, at document #2900000/4922894\n", + "2019-01-31 01:06:01,920 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:02,186 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n", + "2019-01-31 01:06:02,187 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:06:02,188 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:06:02,189 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:06:02,191 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"septemb\" + 
0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"dixi\"\n", + "2019-01-31 01:06:02,197 : INFO : topic diff=0.004961, rho=0.026261\n", + "2019-01-31 01:06:02,355 : INFO : PROGRESS: pass 0, at document #2902000/4922894\n", + "2019-01-31 01:06:03,723 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:03,989 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:06:03,990 : INFO : topic #8 (0.020): 0.029*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:06:03,991 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n", + "2019-01-31 01:06:03,992 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:06:03,993 : INFO : topic #38 (0.020): 0.025*\"walter\" + 0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:06:03,999 : INFO : topic diff=0.003988, rho=0.026252\n", + "2019-01-31 01:06:04,153 : INFO : PROGRESS: pass 0, at document #2904000/4922894\n", + "2019-01-31 01:06:05,520 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:05,786 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" 
+ 0.019*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:06:05,788 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"gestur\" + 0.006*\"workplac\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:06:05,789 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"differ\" + 0.006*\"servitud\"\n", + "2019-01-31 01:06:05,790 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.042*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.022*\"ontario\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"hydrogen\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:06:05,791 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.019*\"regim\" + 0.018*\"cede\"\n", + "2019-01-31 01:06:05,797 : INFO : topic diff=0.003743, rho=0.026243\n", + "2019-01-31 01:06:05,954 : INFO : PROGRESS: pass 0, at document #2906000/4922894\n", + "2019-01-31 01:06:07,337 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:07,603 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.019*\"rivièr\" + 0.017*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:06:07,604 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.019*\"regim\" + 0.018*\"cede\"\n", + "2019-01-31 01:06:07,606 : INFO : topic #38 (0.020): 0.025*\"walter\" + 
0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:06:07,607 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"market\" + 0.012*\"busi\" + 0.011*\"million\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:06:07,608 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.028*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.025*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:06:07,613 : INFO : topic diff=0.003763, rho=0.026234\n", + "2019-01-31 01:06:07,773 : INFO : PROGRESS: pass 0, at document #2908000/4922894\n", + "2019-01-31 01:06:09,170 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:09,436 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.041*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.019*\"leah\" + 0.018*\"korean\" + 0.016*\"kim\" + 0.016*\"sourc\" + 0.013*\"shirin\"\n", + "2019-01-31 01:06:09,437 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.015*\"western\" + 0.014*\"pain\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.010*\"blind\"\n", + "2019-01-31 01:06:09,438 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:06:09,440 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.027*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"council\"\n", + "2019-01-31 01:06:09,441 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.049*\"franc\" + 
0.035*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:06:09,446 : INFO : topic diff=0.004871, rho=0.026225\n", + "2019-01-31 01:06:09,663 : INFO : PROGRESS: pass 0, at document #2910000/4922894\n", + "2019-01-31 01:06:11,063 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:11,329 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"market\" + 0.012*\"busi\" + 0.011*\"million\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:06:11,330 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\" + 0.012*\"physician\"\n", + "2019-01-31 01:06:11,332 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.014*\"republ\" + 0.014*\"report\"\n", + "2019-01-31 01:06:11,333 : INFO : topic #38 (0.020): 0.025*\"walter\" + 0.011*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:06:11,334 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"arsen\" + 0.011*\"collect\" + 0.011*\"nicola\" + 0.011*\"magazin\"\n", + "2019-01-31 01:06:11,340 : INFO : topic diff=0.002952, rho=0.026216\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:06:11,495 : INFO : PROGRESS: pass 0, at document #2912000/4922894\n", + "2019-01-31 01:06:12,956 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
01:06:13,223 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:06:13,224 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 01:06:13,225 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.049*\"franc\" + 0.034*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:06:13,226 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.020*\"idiosyncrat\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.015*\"count\" + 0.013*\"portugues\" + 0.013*\"kingdom\"\n", + "2019-01-31 01:06:13,227 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.034*\"raid\" + 0.022*\"rosenwald\" + 0.021*\"museo\" + 0.021*\"arsen\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 01:06:13,233 : INFO : topic diff=0.004410, rho=0.026207\n", + "2019-01-31 01:06:13,391 : INFO : PROGRESS: pass 0, at document #2914000/4922894\n", + "2019-01-31 01:06:14,784 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:15,051 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.009*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:06:15,052 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.069*\"juli\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.067*\"august\" + 0.066*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 
01:06:15,054 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"workplac\" + 0.006*\"love\" + 0.006*\"gestur\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:06:15,055 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.014*\"republ\" + 0.014*\"report\"\n", + "2019-01-31 01:06:15,056 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.016*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:06:15,062 : INFO : topic diff=0.004112, rho=0.026198\n", + "2019-01-31 01:06:15,221 : INFO : PROGRESS: pass 0, at document #2916000/4922894\n", + "2019-01-31 01:06:16,642 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:16,911 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"differ\" + 0.006*\"servitud\"\n", + "2019-01-31 01:06:16,912 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.030*\"priest\" + 0.021*\"idiosyncrat\" + 0.019*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.015*\"count\" + 0.013*\"portugues\" + 0.012*\"kingdom\"\n", + "2019-01-31 01:06:16,914 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.049*\"franc\" + 0.034*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:06:16,915 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.018*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:06:16,916 
: INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.014*\"republ\" + 0.014*\"report\"\n", + "2019-01-31 01:06:16,921 : INFO : topic diff=0.003684, rho=0.026189\n", + "2019-01-31 01:06:17,077 : INFO : PROGRESS: pass 0, at document #2918000/4922894\n", + "2019-01-31 01:06:18,443 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:18,709 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:06:18,710 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.012*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:06:18,711 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.009*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:06:18,712 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"differ\" + 0.006*\"servitud\"\n", + "2019-01-31 01:06:18,713 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 01:06:18,719 : INFO : topic diff=0.004067, rho=0.026180\n", + "2019-01-31 01:06:21,320 : INFO : -11.774 per-word bound, 3501.6 perplexity estimate based on a held-out corpus of 2000 documents with 520506 words\n", + "2019-01-31 01:06:21,321 : INFO : 
PROGRESS: pass 0, at document #2920000/4922894\n", + "2019-01-31 01:06:22,670 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:22,940 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.044*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"kim\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:06:22,941 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.043*\"popolo\" + 0.041*\"vigour\" + 0.037*\"tortur\" + 0.032*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.019*\"regim\" + 0.018*\"cede\"\n", + "2019-01-31 01:06:22,942 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.019*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:06:22,943 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.009*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:06:22,944 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"arsen\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:06:22,950 : INFO : topic diff=0.004123, rho=0.026171\n", + "2019-01-31 01:06:23,106 : INFO : PROGRESS: pass 0, at document #2922000/4922894\n", + "2019-01-31 01:06:24,481 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:24,748 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.014*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:06:24,749 : INFO : topic #13 (0.020): 0.028*\"australia\" + 
0.027*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:06:24,750 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.018*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"strategist\" + 0.010*\"linear\" + 0.010*\"depress\"\n", + "2019-01-31 01:06:24,751 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"degre\" + 0.012*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 01:06:24,752 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:06:24,758 : INFO : topic diff=0.003835, rho=0.026162\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:06:24,912 : INFO : PROGRESS: pass 0, at document #2924000/4922894\n", + "2019-01-31 01:06:26,293 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:26,559 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.068*\"notion\" + 0.066*\"august\" + 0.066*\"judici\" + 0.066*\"decatur\" + 0.065*\"april\"\n", + "2019-01-31 01:06:26,560 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:06:26,562 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.012*\"european\" + 0.010*\"europ\" + 
0.009*\"austria\"\n", + "2019-01-31 01:06:26,563 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.048*\"american\" + 0.029*\"valour\" + 0.021*\"folei\" + 0.019*\"player\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:06:26,563 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"land\"\n", + "2019-01-31 01:06:26,569 : INFO : topic diff=0.003623, rho=0.026153\n", + "2019-01-31 01:06:26,723 : INFO : PROGRESS: pass 0, at document #2926000/4922894\n", + "2019-01-31 01:06:28,095 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:28,361 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"personifi\" + 0.024*\"poison\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.016*\"turin\" + 0.016*\"poland\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:06:28,362 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:06:28,363 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"diggin\"\n", + "2019-01-31 01:06:28,364 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:06:28,365 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.021*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"feel\" + 0.009*\"male\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 
0.007*\"incom\"\n", + "2019-01-31 01:06:28,371 : INFO : topic diff=0.003958, rho=0.026144\n", + "2019-01-31 01:06:28,523 : INFO : PROGRESS: pass 0, at document #2928000/4922894\n", + "2019-01-31 01:06:29,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:30,143 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:06:30,144 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.048*\"american\" + 0.029*\"valour\" + 0.021*\"folei\" + 0.019*\"player\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:06:30,145 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.011*\"pakistan\" + 0.011*\"sri\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.011*\"alam\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:06:30,146 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:06:30,147 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"octob\" + 0.078*\"sens\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.067*\"august\" + 0.066*\"decatur\" + 0.065*\"april\"\n", + "2019-01-31 01:06:30,153 : INFO : topic diff=0.004249, rho=0.026135\n", + "2019-01-31 01:06:30,311 : INFO : PROGRESS: pass 0, at document #2930000/4922894\n", + "2019-01-31 01:06:31,688 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:31,954 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 
0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:06:31,955 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.058*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:06:31,957 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.011*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:06:31,957 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"israel\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.012*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:06:31,958 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.043*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"kim\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:06:31,964 : INFO : topic diff=0.003839, rho=0.026126\n", + "2019-01-31 01:06:32,133 : INFO : PROGRESS: pass 0, at document #2932000/4922894\n", + "2019-01-31 01:06:33,558 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:33,824 : INFO : topic #20 (0.020): 0.151*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"task\" + 0.010*\"start\"\n", + "2019-01-31 01:06:33,825 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:06:33,827 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"militari\" + 
0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:06:33,828 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.036*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 01:06:33,829 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:06:33,834 : INFO : topic diff=0.004412, rho=0.026118\n", + "2019-01-31 01:06:33,987 : INFO : PROGRESS: pass 0, at document #2934000/4922894\n", + "2019-01-31 01:06:35,336 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:35,603 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.033*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:06:35,604 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.015*\"norwegian\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.012*\"denmark\" + 0.011*\"danish\" + 0.010*\"turkei\"\n", + "2019-01-31 01:06:35,605 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"feel\" + 0.009*\"male\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\"\n", + "2019-01-31 01:06:35,606 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:06:35,607 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.033*\"raid\" + 0.023*\"rosenwald\" + 0.022*\"traceabl\" + 0.021*\"museo\" + 0.019*\"arsen\" + 0.019*\"serv\" + 0.013*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 
01:06:35,612 : INFO : topic diff=0.004612, rho=0.026109\n", + "2019-01-31 01:06:35,766 : INFO : PROGRESS: pass 0, at document #2936000/4922894\n", + "2019-01-31 01:06:37,184 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:06:37,451 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:06:37,452 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.018*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"strategist\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:06:37,453 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:06:37,454 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"idiosyncrat\" + 0.020*\"duke\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.014*\"count\" + 0.013*\"portugues\" + 0.012*\"brazil\"\n", + "2019-01-31 01:06:37,455 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.015*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:06:37,461 : INFO : topic diff=0.003781, rho=0.026100\n", + "2019-01-31 01:06:37,623 : INFO : PROGRESS: pass 0, at document #2938000/4922894\n", + "2019-01-31 01:06:38,972 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:39,241 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.023*\"korea\" 
+ 0.019*\"korean\" + 0.018*\"leah\" + 0.016*\"kim\" + 0.016*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:06:39,242 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.027*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"gener\" + 0.016*\"start\" + 0.015*\"council\"\n", + "2019-01-31 01:06:39,243 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.035*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 01:06:39,244 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"candid\"\n", + "2019-01-31 01:06:39,246 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"simultan\" + 0.016*\"muscl\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:06:39,251 : INFO : topic diff=0.003591, rho=0.026091\n", + "2019-01-31 01:06:41,885 : INFO : -11.647 per-word bound, 3205.9 perplexity estimate based on a held-out corpus of 2000 documents with 510279 words\n", + "2019-01-31 01:06:41,885 : INFO : PROGRESS: pass 0, at document #2940000/4922894\n", + "2019-01-31 01:06:43,251 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:43,517 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.029*\"final\" + 0.025*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.013*\"tiepolo\" + 0.013*\"martin\"\n", + "2019-01-31 01:06:43,518 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 
0.015*\"unfortun\" + 0.015*\"turin\"\n", + "2019-01-31 01:06:43,519 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:06:43,521 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"israel\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.012*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:06:43,522 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.034*\"raid\" + 0.024*\"rosenwald\" + 0.022*\"traceabl\" + 0.020*\"museo\" + 0.019*\"arsen\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"brook\"\n", + "2019-01-31 01:06:43,528 : INFO : topic diff=0.004179, rho=0.026082\n", + "2019-01-31 01:06:43,685 : INFO : PROGRESS: pass 0, at document #2942000/4922894\n", + "2019-01-31 01:06:45,092 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:45,359 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.012*\"televis\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.011*\"sri\" + 0.011*\"alam\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:06:45,360 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 01:06:45,361 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:06:45,362 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.059*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 
0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:06:45,363 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.024*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"governor\"\n", + "2019-01-31 01:06:45,368 : INFO : topic diff=0.003636, rho=0.026073\n", + "2019-01-31 01:06:45,582 : INFO : PROGRESS: pass 0, at document #2944000/4922894\n", + "2019-01-31 01:06:46,972 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:47,239 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:06:47,240 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"centuri\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:06:47,241 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"base\"\n", + "2019-01-31 01:06:47,242 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:06:47,243 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"solitari\"\n", + "2019-01-31 01:06:47,249 : INFO : topic diff=0.004064, rho=0.026064\n", + "2019-01-31 01:06:47,403 : INFO : PROGRESS: pass 0, at document #2946000/4922894\n", + 
"2019-01-31 01:06:48,771 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:49,037 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"storag\"\n", + "2019-01-31 01:06:49,038 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.027*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:06:49,039 : INFO : topic #20 (0.020): 0.151*\"scholar\" + 0.038*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.009*\"start\"\n", + "2019-01-31 01:06:49,040 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.037*\"tortur\" + 0.033*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.019*\"adulthood\" + 0.019*\"cede\"\n", + "2019-01-31 01:06:49,041 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"sri\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"alam\" + 0.010*\"muskoge\"\n", + "2019-01-31 01:06:49,047 : INFO : topic diff=0.003477, rho=0.026055\n", + "2019-01-31 01:06:49,200 : INFO : PROGRESS: pass 0, at document #2948000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:06:50,571 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:50,837 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:06:50,839 : INFO : topic #41 (0.020): 0.040*\"citi\" 
+ 0.023*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 01:06:50,840 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:06:50,841 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n", + "2019-01-31 01:06:50,842 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.006*\"summerhil\" + 0.006*\"workplac\"\n", + "2019-01-31 01:06:50,848 : INFO : topic diff=0.003853, rho=0.026047\n", + "2019-01-31 01:06:51,006 : INFO : PROGRESS: pass 0, at document #2950000/4922894\n", + "2019-01-31 01:06:52,398 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:52,668 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"edit\" + 0.013*\"arsen\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:06:52,669 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:06:52,670 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.047*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.017*\"english\" + 0.017*\"polit\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:06:52,671 : INFO : topic #39 (0.020): 0.057*\"canada\" + 
0.044*\"canadian\" + 0.023*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:06:52,672 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.018*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:06:52,678 : INFO : topic diff=0.004486, rho=0.026038\n", + "2019-01-31 01:06:52,838 : INFO : PROGRESS: pass 0, at document #2952000/4922894\n", + "2019-01-31 01:06:54,238 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:54,505 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"market\" + 0.011*\"produc\" + 0.011*\"million\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:06:54,506 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"josé\"\n", + "2019-01-31 01:06:54,507 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.026*\"hous\" + 0.018*\"buford\" + 0.018*\"rivièr\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.010*\"depress\" + 0.010*\"strategist\" + 0.010*\"silicon\"\n", + "2019-01-31 01:06:54,508 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:06:54,509 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.011*\"affection\" + 0.011*\"alam\" + 0.011*\"anglo\" + 0.011*\"sri\" + 0.010*\"muskoge\"\n", + "2019-01-31 01:06:54,515 : INFO : topic diff=0.004274, 
rho=0.026029\n", + "2019-01-31 01:06:54,674 : INFO : PROGRESS: pass 0, at document #2954000/4922894\n", + "2019-01-31 01:06:56,067 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:56,333 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.011*\"find\" + 0.011*\"fool\" + 0.011*\"théori\" + 0.010*\"squatter\"\n", + "2019-01-31 01:06:56,335 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:06:56,336 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.029*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.014*\"tiepolo\" + 0.013*\"martin\"\n", + "2019-01-31 01:06:56,337 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:06:56,338 : INFO : topic #13 (0.020): 0.027*\"new\" + 0.027*\"australia\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:06:56,343 : INFO : topic diff=0.004382, rho=0.026020\n", + "2019-01-31 01:06:56,505 : INFO : PROGRESS: pass 0, at document #2956000/4922894\n", + "2019-01-31 01:06:57,928 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:58,194 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.020*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"josé\"\n", + "2019-01-31 
01:06:58,195 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:06:58,196 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.033*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:06:58,197 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:06:58,198 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:06:58,204 : INFO : topic diff=0.003995, rho=0.026011\n", + "2019-01-31 01:06:58,359 : INFO : PROGRESS: pass 0, at document #2958000/4922894\n", + "2019-01-31 01:06:59,726 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:06:59,993 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"candid\"\n", + "2019-01-31 01:06:59,994 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.013*\"tornado\" + 0.011*\"find\" + 0.011*\"fool\" + 0.011*\"théori\" + 0.010*\"squatter\"\n", + "2019-01-31 01:06:59,995 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:06:59,996 
: INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.034*\"raid\" + 0.024*\"rosenwald\" + 0.022*\"traceabl\" + 0.020*\"museo\" + 0.018*\"serv\" + 0.018*\"arsen\" + 0.013*\"oper\" + 0.010*\"brook\"\n", + "2019-01-31 01:06:59,997 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.005*\"wander\" + 0.004*\"call\"\n", + "2019-01-31 01:07:00,003 : INFO : topic diff=0.003716, rho=0.026003\n", + "2019-01-31 01:07:02,730 : INFO : -11.626 per-word bound, 3161.7 perplexity estimate based on a held-out corpus of 2000 documents with 584538 words\n", + "2019-01-31 01:07:02,731 : INFO : PROGRESS: pass 0, at document #2960000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:07:04,132 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:04,399 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.014*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n", + "2019-01-31 01:07:04,400 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.022*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"yawn\"\n", + "2019-01-31 01:07:04,401 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:07:04,402 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\" + 0.017*\"atheist\"\n", + "2019-01-31 01:07:04,403 : INFO : topic #20 (0.020): 0.149*\"scholar\" 
+ 0.038*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:07:04,409 : INFO : topic diff=0.004390, rho=0.025994\n", + "2019-01-31 01:07:04,567 : INFO : PROGRESS: pass 0, at document #2962000/4922894\n", + "2019-01-31 01:07:05,949 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:06,219 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:07:06,220 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:07:06,221 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.018*\"buford\" + 0.018*\"rivièr\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"strategist\" + 0.010*\"linear\"\n", + "2019-01-31 01:07:06,222 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:07:06,223 : INFO : topic #48 (0.020): 0.083*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.072*\"januari\" + 0.068*\"juli\" + 0.068*\"notion\" + 0.065*\"judici\" + 0.065*\"august\" + 0.065*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:07:06,229 : INFO : topic diff=0.004177, rho=0.025985\n", + "2019-01-31 01:07:06,380 : INFO : PROGRESS: pass 0, at document #2964000/4922894\n", + "2019-01-31 01:07:07,732 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:07,998 : INFO : topic #48 (0.020): 
0.083*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.068*\"notion\" + 0.066*\"judici\" + 0.066*\"august\" + 0.065*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:07:07,999 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:07:08,000 : INFO : topic #46 (0.020): 0.016*\"norwai\" + 0.016*\"sweden\" + 0.016*\"stop\" + 0.015*\"swedish\" + 0.015*\"norwegian\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.011*\"treeless\" + 0.011*\"denmark\" + 0.011*\"danish\"\n", + "2019-01-31 01:07:08,001 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.070*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.018*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:07:08,002 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:07:08,008 : INFO : topic diff=0.004479, rho=0.025976\n", + "2019-01-31 01:07:08,162 : INFO : PROGRESS: pass 0, at document #2966000/4922894\n", + "2019-01-31 01:07:09,545 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:09,811 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.042*\"chilton\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.016*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:07:09,812 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"théori\" + 0.010*\"squatter\"\n", + "2019-01-31 01:07:09,813 : INFO : topic #36 (0.020): 
0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"base\"\n", + "2019-01-31 01:07:09,814 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:07:09,815 : INFO : topic #48 (0.020): 0.083*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.068*\"notion\" + 0.066*\"judici\" + 0.066*\"august\" + 0.065*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:07:09,821 : INFO : topic diff=0.003740, rho=0.025967\n", + "2019-01-31 01:07:09,974 : INFO : PROGRESS: pass 0, at document #2968000/4922894\n", + "2019-01-31 01:07:11,343 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:11,610 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.016*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:07:11,611 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.019*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:07:11,612 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"feel\" + 0.009*\"male\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:07:11,612 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"liber\"\n", + "2019-01-31 01:07:11,614 : INFO : topic #41 (0.020): 0.040*\"citi\" + 
0.022*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 01:07:11,619 : INFO : topic diff=0.004443, rho=0.025959\n", + "2019-01-31 01:07:11,780 : INFO : PROGRESS: pass 0, at document #2970000/4922894\n", + "2019-01-31 01:07:13,182 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:13,448 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\" + 0.013*\"martin\"\n", + "2019-01-31 01:07:13,449 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:07:13,450 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.022*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"hot\"\n", + "2019-01-31 01:07:13,451 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.014*\"will\" + 0.012*\"david\" + 0.012*\"jame\" + 0.010*\"mexican–american\" + 0.010*\"rival\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:07:13,452 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:07:13,458 : INFO : topic diff=0.003788, rho=0.025950\n", + "2019-01-31 01:07:13,615 : INFO : PROGRESS: pass 0, at document #2972000/4922894\n", + "2019-01-31 01:07:15,016 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:15,283 : INFO : topic #22 (0.020): 
0.034*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.012*\"genu\" + 0.009*\"feel\" + 0.008*\"male\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.008*\"incom\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:07:15,284 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.019*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:07:15,286 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.008*\"human\" + 0.007*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:07:15,287 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:07:15,288 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.047*\"american\" + 0.028*\"valour\" + 0.022*\"folei\" + 0.020*\"player\" + 0.019*\"dutch\" + 0.016*\"english\" + 0.016*\"polit\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:07:15,294 : INFO : topic diff=0.003298, rho=0.025941\n", + "2019-01-31 01:07:15,507 : INFO : PROGRESS: pass 0, at document #2974000/4922894\n", + "2019-01-31 01:07:16,891 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:17,158 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.044*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"new\" + 0.014*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 01:07:17,159 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"illicit\" + 0.016*\"colder\" + 0.015*\"pain\" + 0.015*\"western\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 
0.009*\"blind\"\n", + "2019-01-31 01:07:17,160 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"josé\"\n", + "2019-01-31 01:07:17,161 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.014*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"mexican–american\" + 0.010*\"rival\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:07:17,162 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"workplac\" + 0.006*\"storag\" + 0.006*\"dixi\"\n", + "2019-01-31 01:07:17,168 : INFO : topic diff=0.003809, rho=0.025933\n", + "2019-01-31 01:07:17,327 : INFO : PROGRESS: pass 0, at document #2976000/4922894\n", + "2019-01-31 01:07:18,736 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:19,002 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.032*\"priest\" + 0.020*\"idiosyncrat\" + 0.019*\"duke\" + 0.019*\"rotterdam\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.014*\"count\" + 0.014*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:07:19,003 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"council\"\n", + "2019-01-31 01:07:19,004 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"ural\"\n", + "2019-01-31 01:07:19,005 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.010*\"relationship\" + 0.010*\"centuri\" + 0.009*\"cathedr\" 
+ 0.009*\"historiographi\"\n", + "2019-01-31 01:07:19,006 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"love\" + 0.006*\"workplac\" + 0.006*\"storag\" + 0.006*\"dixi\"\n", + "2019-01-31 01:07:19,012 : INFO : topic diff=0.003767, rho=0.025924\n", + "2019-01-31 01:07:19,170 : INFO : PROGRESS: pass 0, at document #2978000/4922894\n", + "2019-01-31 01:07:20,577 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:20,843 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"théori\" + 0.011*\"squatter\"\n", + "2019-01-31 01:07:20,844 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:07:20,845 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.044*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.013*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:07:20,846 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:07:20,848 : INFO : topic #6 (0.020): 0.073*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.014*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n", + "2019-01-31 01:07:20,853 : INFO : topic diff=0.003541, rho=0.025915\n", + "2019-01-31 01:07:23,514 : INFO : -11.815 per-word bound, 3602.4 perplexity estimate based on a held-out corpus of 2000 documents with 
552617 words\n", + "2019-01-31 01:07:23,515 : INFO : PROGRESS: pass 0, at document #2980000/4922894\n", + "2019-01-31 01:07:24,881 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:25,147 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.045*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:07:25,148 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.019*\"adulthood\" + 0.019*\"cede\"\n", + "2019-01-31 01:07:25,149 : INFO : topic #36 (0.020): 0.010*\"prognosi\" + 0.010*\"network\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"ural\"\n", + "2019-01-31 01:07:25,150 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.012*\"market\" + 0.011*\"produc\" + 0.011*\"million\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:07:25,151 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.022*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"council\"\n", + "2019-01-31 01:07:25,156 : INFO : topic diff=0.003830, rho=0.025906\n", + "2019-01-31 01:07:25,316 : INFO : PROGRESS: pass 0, at document #2982000/4922894\n", + "2019-01-31 01:07:26,713 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:26,980 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"genu\" + 0.012*\"plaisir\" + 0.009*\"feel\" + 0.008*\"biom\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 01:07:26,981 : INFO : topic #29 (0.020): 
0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.012*\"market\" + 0.011*\"produc\" + 0.011*\"million\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:07:26,982 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.011*\"movi\"\n", + "2019-01-31 01:07:26,983 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:07:26,984 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.010*\"elabor\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"candid\"\n", + "2019-01-31 01:07:26,990 : INFO : topic diff=0.003649, rho=0.025898\n", + "2019-01-31 01:07:27,149 : INFO : PROGRESS: pass 0, at document #2984000/4922894\n", + "2019-01-31 01:07:28,536 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:28,802 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"land\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:07:28,803 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:07:28,804 : INFO : topic #46 (0.020): 0.016*\"sweden\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.016*\"swedish\" + 0.015*\"stop\" + 0.015*\"norwegian\" + 0.013*\"wind\" + 0.011*\"denmark\" + 0.011*\"danish\" + 
0.011*\"treeless\"\n", + "2019-01-31 01:07:28,805 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.024*\"area\" + 0.022*\"multitud\" + 0.020*\"citi\" + 0.019*\"adulthood\" + 0.019*\"cede\"\n", + "2019-01-31 01:07:28,806 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.027*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"council\"\n", + "2019-01-31 01:07:28,812 : INFO : topic diff=0.003988, rho=0.025889\n", + "2019-01-31 01:07:28,976 : INFO : PROGRESS: pass 0, at document #2986000/4922894\n", + "2019-01-31 01:07:30,367 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:30,636 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 0.006*\"love\" + 0.006*\"workplac\" + 0.006*\"gestur\"\n", + "2019-01-31 01:07:30,637 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"pain\" + 0.014*\"western\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:07:30,638 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.014*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:07:30,639 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n", + "2019-01-31 01:07:30,640 : INFO : topic #28 (0.020): 0.032*\"build\" + 0.025*\"hous\" + 0.018*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.010*\"depress\" + 0.010*\"strategist\" + 
0.010*\"silicon\"\n", + "2019-01-31 01:07:30,646 : INFO : topic diff=0.003692, rho=0.025880\n", + "2019-01-31 01:07:30,800 : INFO : PROGRESS: pass 0, at document #2988000/4922894\n", + "2019-01-31 01:07:32,169 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:32,436 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"genu\" + 0.011*\"plaisir\" + 0.008*\"feel\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.008*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 01:07:32,437 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.020*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:07:32,438 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.012*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:07:32,438 : INFO : topic #13 (0.020): 0.026*\"new\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:07:32,439 : INFO : topic #20 (0.020): 0.151*\"scholar\" + 0.039*\"struggl\" + 0.038*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"class\" + 0.009*\"district\"\n", + "2019-01-31 01:07:32,445 : INFO : topic diff=0.003734, rho=0.025872\n", + "2019-01-31 01:07:32,603 : INFO : PROGRESS: pass 0, at document #2990000/4922894\n", + "2019-01-31 01:07:33,990 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:34,258 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 
0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 01:07:34,259 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.012*\"genu\" + 0.008*\"feel\" + 0.008*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.008*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 01:07:34,260 : INFO : topic #47 (0.020): 0.068*\"muscl\" + 0.034*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\" + 0.011*\"physician\"\n", + "2019-01-31 01:07:34,261 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.015*\"sail\" + 0.010*\"relationship\" + 0.010*\"centuri\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:07:34,262 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.047*\"american\" + 0.027*\"valour\" + 0.021*\"folei\" + 0.020*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:07:34,268 : INFO : topic diff=0.003532, rho=0.025863\n", + "2019-01-31 01:07:34,423 : INFO : PROGRESS: pass 0, at document #2992000/4922894\n", + "2019-01-31 01:07:35,815 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:36,082 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"pain\" + 0.014*\"western\" + 0.013*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.009*\"blind\"\n", + "2019-01-31 01:07:36,083 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 0.006*\"workplac\" + 0.006*\"love\" + 0.006*\"gestur\"\n", + "2019-01-31 01:07:36,084 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 
0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"land\"\n", + "2019-01-31 01:07:36,085 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.034*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"tyrant\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:07:36,086 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"pop\" + 0.011*\"network\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"ural\"\n", + "2019-01-31 01:07:36,092 : INFO : topic diff=0.003888, rho=0.025854\n", + "2019-01-31 01:07:36,248 : INFO : PROGRESS: pass 0, at document #2994000/4922894\n", + "2019-01-31 01:07:37,621 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:37,887 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.010*\"refut\"\n", + "2019-01-31 01:07:37,888 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:07:37,889 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.022*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.012*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:07:37,890 : INFO : topic #20 (0.020): 0.151*\"scholar\" + 0.038*\"high\" + 0.038*\"struggl\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.010*\"district\" + 0.010*\"gothic\"\n", + "2019-01-31 01:07:37,891 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 
0.017*\"grammat\" + 0.014*\"portugues\" + 0.014*\"count\" + 0.013*\"brazil\"\n", + "2019-01-31 01:07:37,897 : INFO : topic diff=0.004370, rho=0.025846\n", + "2019-01-31 01:07:38,060 : INFO : PROGRESS: pass 0, at document #2996000/4922894\n", + "2019-01-31 01:07:39,450 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:39,719 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:07:39,720 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:07:39,721 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.012*\"genu\" + 0.008*\"feel\" + 0.008*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.008*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 01:07:39,723 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 01:07:39,724 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"wander\" + 0.004*\"call\"\n", + "2019-01-31 01:07:39,730 : INFO : topic diff=0.004008, rho=0.025837\n", + "2019-01-31 01:07:39,888 : INFO : PROGRESS: pass 0, at document #2998000/4922894\n", + "2019-01-31 01:07:41,402 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:41,669 : INFO : topic #34 (0.020): 0.067*\"start\" + 
0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:07:41,670 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.034*\"raid\" + 0.024*\"rosenwald\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.018*\"museo\" + 0.015*\"arsen\" + 0.013*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 01:07:41,671 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.021*\"folei\" + 0.020*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:07:41,672 : INFO : topic #47 (0.020): 0.067*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"word\" + 0.012*\"physician\"\n", + "2019-01-31 01:07:41,673 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.012*\"market\" + 0.011*\"million\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:07:41,679 : INFO : topic diff=0.003026, rho=0.025828\n", + "2019-01-31 01:07:44,342 : INFO : -11.517 per-word bound, 2929.7 perplexity estimate based on a held-out corpus of 2000 documents with 539424 words\n", + "2019-01-31 01:07:44,342 : INFO : PROGRESS: pass 0, at document #3000000/4922894\n", + "2019-01-31 01:07:45,715 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:45,981 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.012*\"genu\" + 0.008*\"feel\" + 0.008*\"biom\" + 0.008*\"western\" + 0.008*\"male\" + 0.008*\"median\" + 0.007*\"incom\"\n", + "2019-01-31 01:07:45,982 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 
0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:07:45,984 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.030*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 01:07:45,985 : INFO : topic #20 (0.020): 0.151*\"scholar\" + 0.038*\"struggl\" + 0.038*\"high\" + 0.030*\"educ\" + 0.022*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.010*\"district\" + 0.010*\"gothic\"\n", + "2019-01-31 01:07:45,986 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:07:45,992 : INFO : topic diff=0.002984, rho=0.025820\n", + "2019-01-31 01:07:46,148 : INFO : PROGRESS: pass 0, at document #3002000/4922894\n", + "2019-01-31 01:07:47,540 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:47,807 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 01:07:47,808 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:07:47,809 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.034*\"raid\" + 0.024*\"rosenwald\" + 0.021*\"traceabl\" + 0.019*\"serv\" + 0.018*\"museo\" + 0.014*\"arsen\" + 0.013*\"oper\" + 0.010*\"brook\"\n", + "2019-01-31 01:07:47,810 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.006*\"measur\" + 
0.006*\"method\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 01:07:47,812 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 01:07:47,817 : INFO : topic diff=0.003965, rho=0.025811\n", + "2019-01-31 01:07:47,975 : INFO : PROGRESS: pass 0, at document #3004000/4922894\n", + "2019-01-31 01:07:49,377 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:49,643 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"francisco\"\n", + "2019-01-31 01:07:49,644 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:07:49,645 : INFO : topic #46 (0.020): 0.016*\"sweden\" + 0.016*\"stop\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.012*\"wind\" + 0.011*\"danish\" + 0.011*\"denmark\" + 0.010*\"turkish\"\n", + "2019-01-31 01:07:49,646 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.022*\"new\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.012*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:07:49,647 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:07:49,653 : INFO : topic diff=0.003540, rho=0.025803\n", + "2019-01-31 01:07:49,864 : INFO : PROGRESS: pass 0, at document #3006000/4922894\n", + "2019-01-31 01:07:51,252 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:51,518 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:07:51,519 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"acrimoni\" + 0.011*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 01:07:51,520 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:07:51,521 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.034*\"raid\" + 0.024*\"rosenwald\" + 0.021*\"traceabl\" + 0.020*\"serv\" + 0.018*\"museo\" + 0.014*\"arsen\" + 0.013*\"oper\" + 0.010*\"brook\"\n", + "2019-01-31 01:07:51,522 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.021*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:07:51,528 : INFO : topic diff=0.003522, rho=0.025794\n", + "2019-01-31 01:07:51,686 : INFO : PROGRESS: pass 0, at document #3008000/4922894\n", + "2019-01-31 01:07:53,094 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:53,370 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.014*\"count\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:07:53,371 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 
0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:07:53,372 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"summerhil\" + 0.006*\"woman\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:07:53,373 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.021*\"folei\" + 0.020*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:07:53,374 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.034*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:07:53,380 : INFO : topic diff=0.003674, rho=0.025786\n", + "2019-01-31 01:07:53,540 : INFO : PROGRESS: pass 0, at document #3010000/4922894\n", + "2019-01-31 01:07:54,944 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:55,210 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.019*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:07:55,211 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:07:55,212 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:07:55,213 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 
0.007*\"poet\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"utopian\"\n", + "2019-01-31 01:07:55,214 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.021*\"folei\" + 0.020*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:07:55,220 : INFO : topic diff=0.003409, rho=0.025777\n", + "2019-01-31 01:07:55,379 : INFO : PROGRESS: pass 0, at document #3012000/4922894\n", + "2019-01-31 01:07:56,776 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:57,042 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:07:57,043 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:07:57,044 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"vacant\"\n", + "2019-01-31 01:07:57,045 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.071*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"festiv\" + 0.021*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:07:57,046 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.014*\"arsen\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\"\n", + "2019-01-31 01:07:57,052 : INFO : topic diff=0.003147, rho=0.025768\n", + "2019-01-31 01:07:57,207 : INFO : 
PROGRESS: pass 0, at document #3014000/4922894\n", + "2019-01-31 01:07:58,585 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:07:58,851 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"francisco\"\n", + "2019-01-31 01:07:58,852 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"democrat\" + 0.023*\"voluntari\" + 0.022*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.013*\"bypass\" + 0.013*\"report\" + 0.013*\"seaport\"\n", + "2019-01-31 01:07:58,853 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:07:58,854 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.020*\"folei\" + 0.020*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:07:58,855 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 01:07:58,860 : INFO : topic diff=0.003655, rho=0.025760\n", + "2019-01-31 01:07:59,010 : INFO : PROGRESS: pass 0, at document #3016000/4922894\n", + "2019-01-31 01:08:00,361 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:00,627 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.026*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"wale\" + 0.015*\"youth\"\n", + "2019-01-31 01:08:00,628 : INFO : topic #38 (0.020): 0.024*\"walter\" + 
0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.006*\"till\" + 0.006*\"govern\"\n", + "2019-01-31 01:08:00,629 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.015*\"jewish\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"israel\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:08:00,630 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:08:00,631 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.022*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.013*\"liber\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:08:00,637 : INFO : topic diff=0.004276, rho=0.025751\n", + "2019-01-31 01:08:00,793 : INFO : PROGRESS: pass 0, at document #3018000/4922894\n", + "2019-01-31 01:08:02,150 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:02,418 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"woman\" + 0.029*\"champion\" + 0.024*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:08:02,419 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.008*\"feel\" + 0.008*\"biom\" + 0.008*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.007*\"incom\"\n", + "2019-01-31 01:08:02,420 : INFO : topic #49 (0.020): 0.046*\"india\" + 0.030*\"incumb\" + 0.016*\"pakistan\" + 0.013*\"islam\" + 0.012*\"muskoge\" + 0.012*\"affection\" + 0.012*\"anglo\" + 0.011*\"alam\" + 0.011*\"televis\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:08:02,421 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.030*\"final\" + 
0.024*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.012*\"open\"\n", + "2019-01-31 01:08:02,422 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"francisco\"\n", + "2019-01-31 01:08:02,428 : INFO : topic diff=0.004323, rho=0.025743\n", + "2019-01-31 01:08:05,099 : INFO : -11.657 per-word bound, 3229.3 perplexity estimate based on a held-out corpus of 2000 documents with 541996 words\n", + "2019-01-31 01:08:05,100 : INFO : PROGRESS: pass 0, at document #3020000/4922894\n", + "2019-01-31 01:08:06,479 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:06,745 : INFO : topic #32 (0.020): 0.048*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.024*\"area\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.020*\"adulthood\" + 0.019*\"cede\"\n", + "2019-01-31 01:08:06,746 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:08:06,748 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:08:06,749 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.016*\"colder\" + 0.016*\"pain\" + 0.014*\"western\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.010*\"blind\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:08:06,750 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.071*\"best\" + 0.033*\"yawn\" + 
0.028*\"jacksonvil\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.021*\"japanes\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:08:06,755 : INFO : topic diff=0.003816, rho=0.025734\n", + "2019-01-31 01:08:06,911 : INFO : PROGRESS: pass 0, at document #3022000/4922894\n", + "2019-01-31 01:08:08,284 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:08,550 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:08:08,551 : INFO : topic #32 (0.020): 0.048*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.024*\"area\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.020*\"adulthood\" + 0.019*\"cede\"\n", + "2019-01-31 01:08:08,553 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.017*\"quarterli\" + 0.016*\"grammat\" + 0.014*\"count\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:08:08,554 : INFO : topic #37 (0.020): 0.011*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"vision\" + 0.006*\"love\" + 0.006*\"storag\"\n", + "2019-01-31 01:08:08,555 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:08:08,561 : INFO : topic diff=0.003301, rho=0.025726\n", + "2019-01-31 01:08:08,716 : INFO : PROGRESS: pass 0, at document #3024000/4922894\n", + "2019-01-31 01:08:10,075 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:10,344 : INFO : topic #34 (0.020): 0.067*\"start\" + 
0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:08:10,345 : INFO : topic #20 (0.020): 0.150*\"scholar\" + 0.038*\"high\" + 0.037*\"struggl\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:08:10,346 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:08:10,347 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.023*\"area\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.020*\"adulthood\" + 0.019*\"cede\"\n", + "2019-01-31 01:08:10,348 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"new\" + 0.027*\"sourc\" + 0.026*\"london\" + 0.023*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.015*\"wale\"\n", + "2019-01-31 01:08:10,354 : INFO : topic diff=0.004919, rho=0.025717\n", + "2019-01-31 01:08:10,509 : INFO : PROGRESS: pass 0, at document #3026000/4922894\n", + "2019-01-31 01:08:11,871 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:12,137 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.012*\"word\" + 0.012*\"olympo\" + 0.012*\"physician\"\n", + "2019-01-31 01:08:12,138 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"median\" + 0.009*\"biom\" + 0.008*\"feel\" + 0.008*\"western\" + 0.008*\"male\" + 0.008*\"incom\"\n", + "2019-01-31 01:08:12,139 : INFO : topic #15 (0.020): 0.011*\"small\" + 
0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"summerhil\" + 0.006*\"workplac\"\n", + "2019-01-31 01:08:12,140 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.022*\"bishop\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"cathedr\" + 0.010*\"parish\" + 0.009*\"centuri\"\n", + "2019-01-31 01:08:12,141 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:08:12,147 : INFO : topic diff=0.004164, rho=0.025709\n", + "2019-01-31 01:08:12,303 : INFO : PROGRESS: pass 0, at document #3028000/4922894\n", + "2019-01-31 01:08:13,694 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:13,959 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"differ\" + 0.006*\"utopian\"\n", + "2019-01-31 01:08:13,960 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.079*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.070*\"notion\" + 0.070*\"juli\" + 0.068*\"decatur\" + 0.067*\"april\" + 0.067*\"judici\" + 0.067*\"august\"\n", + "2019-01-31 01:08:13,962 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:08:13,963 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"battalion\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"till\"\n", + "2019-01-31 01:08:13,964 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.013*\"will\" + 
0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:08:13,970 : INFO : topic diff=0.004164, rho=0.025700\n", + "2019-01-31 01:08:14,123 : INFO : PROGRESS: pass 0, at document #3030000/4922894\n", + "2019-01-31 01:08:15,489 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:15,756 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.024*\"hoar\" + 0.022*\"toronto\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:08:15,757 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:08:15,758 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:08:15,759 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:08:15,760 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.022*\"bishop\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.010*\"cathedr\" + 0.009*\"centuri\"\n", + "2019-01-31 01:08:15,766 : INFO : topic diff=0.004628, rho=0.025692\n", + "2019-01-31 01:08:15,921 : INFO : PROGRESS: pass 0, at document #3032000/4922894\n", + "2019-01-31 01:08:17,289 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:17,556 : INFO : topic #47 (0.020): 
0.065*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.012*\"physician\" + 0.012*\"word\" + 0.012*\"olympo\"\n", + "2019-01-31 01:08:17,557 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.022*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"liber\"\n", + "2019-01-31 01:08:17,558 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.022*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:08:17,559 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:08:17,560 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:08:17,566 : INFO : topic diff=0.002821, rho=0.025683\n", + "2019-01-31 01:08:17,728 : INFO : PROGRESS: pass 0, at document #3034000/4922894\n", + "2019-01-31 01:08:19,136 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:19,405 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.022*\"reprint\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:08:19,406 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"battalion\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"till\"\n", + 
"2019-01-31 01:08:19,407 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"trade\" + 0.009*\"origin\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:08:19,408 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"includ\" + 0.007*\"base\"\n", + "2019-01-31 01:08:19,410 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:08:19,415 : INFO : topic diff=0.005355, rho=0.025675\n", + "2019-01-31 01:08:19,567 : INFO : PROGRESS: pass 0, at document #3036000/4922894\n", + "2019-01-31 01:08:20,902 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:21,168 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:08:21,169 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.015*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.012*\"collect\" + 0.011*\"storag\" + 0.011*\"nicola\"\n", + "2019-01-31 01:08:21,171 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.015*\"ret\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 01:08:21,172 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"pain\" + 0.014*\"western\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.010*\"blind\"\n", + "2019-01-31 
01:08:21,173 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:08:21,179 : INFO : topic diff=0.004771, rho=0.025666\n", + "2019-01-31 01:08:21,334 : INFO : PROGRESS: pass 0, at document #3038000/4922894\n", + "2019-01-31 01:08:22,713 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:22,979 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"serv\" + 0.022*\"govern\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:08:22,980 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.015*\"ret\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 01:08:22,981 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:22,982 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"pain\" + 0.014*\"western\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.010*\"blind\"\n", + "2019-01-31 01:08:22,983 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.015*\"jewish\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:08:22,989 : INFO : topic diff=0.003575, rho=0.025658\n", + "2019-01-31 01:08:25,738 : INFO : -11.663 per-word bound, 3243.6 perplexity estimate based on a held-out corpus of 2000 documents with 565012 words\n", + "2019-01-31 01:08:25,739 : INFO : PROGRESS: 
pass 0, at document #3040000/4922894\n", + "2019-01-31 01:08:27,108 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:27,375 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"colder\" + 0.016*\"pain\" + 0.014*\"western\" + 0.014*\"black\" + 0.011*\"record\" + 0.010*\"depress\" + 0.010*\"blind\"\n", + "2019-01-31 01:08:27,376 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.023*\"hoar\" + 0.023*\"toronto\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:08:27,377 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"wander\"\n", + "2019-01-31 01:08:27,378 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:27,379 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"differ\"\n", + "2019-01-31 01:08:27,385 : INFO : topic diff=0.003932, rho=0.025649\n", + "2019-01-31 01:08:27,536 : INFO : PROGRESS: pass 0, at document #3042000/4922894\n", + "2019-01-31 01:08:28,874 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:29,140 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.034*\"raid\" + 0.023*\"rosenwald\" + 0.021*\"traceabl\" + 0.020*\"serv\" + 0.017*\"museo\" + 0.014*\"oper\" + 0.012*\"arsen\" + 0.010*\"radiu\"\n", + "2019-01-31 01:08:29,141 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" 
+ 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:29,143 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.006*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:08:29,144 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 01:08:29,145 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.017*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 01:08:29,151 : INFO : topic diff=0.005300, rho=0.025641\n", + "2019-01-31 01:08:29,311 : INFO : PROGRESS: pass 0, at document #3044000/4922894\n", + "2019-01-31 01:08:30,726 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:30,992 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.012*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"itali\" + 0.010*\"carlo\"\n", + "2019-01-31 01:08:30,993 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.011*\"movi\"\n", + "2019-01-31 01:08:30,995 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:08:30,996 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 
0.015*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"yawn\"\n", + "2019-01-31 01:08:30,997 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:08:31,003 : INFO : topic diff=0.004402, rho=0.025633\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:08:31,158 : INFO : PROGRESS: pass 0, at document #3046000/4922894\n", + "2019-01-31 01:08:32,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:32,799 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"biom\" + 0.008*\"feel\" + 0.008*\"western\" + 0.008*\"male\" + 0.008*\"median\" + 0.007*\"incom\"\n", + "2019-01-31 01:08:32,800 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:08:32,802 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:32,803 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:08:32,804 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"bahá\" + 0.010*\"nativist\" + 0.009*\"fleet\"\n", + "2019-01-31 01:08:32,809 : INFO : topic diff=0.004820, 
rho=0.025624\n", + "2019-01-31 01:08:32,966 : INFO : PROGRESS: pass 0, at document #3048000/4922894\n", + "2019-01-31 01:08:34,354 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:34,621 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.018*\"theater\" + 0.017*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.012*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 01:08:34,622 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.018*\"new\" + 0.015*\"arsen\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.010*\"storag\" + 0.010*\"worldwid\"\n", + "2019-01-31 01:08:34,623 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:08:34,624 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:08:34,625 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:08:34,631 : INFO : topic diff=0.003406, rho=0.025616\n", + "2019-01-31 01:08:34,788 : INFO : PROGRESS: pass 0, at document #3050000/4922894\n", + "2019-01-31 01:08:36,178 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:36,445 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"swedish\" + 0.016*\"stop\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.012*\"treeless\" + 0.012*\"wind\" + 0.011*\"denmark\" + 0.011*\"danish\"\n", + "2019-01-31 01:08:36,446 : 
INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.023*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:08:36,447 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:08:36,448 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:08:36,449 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:08:36,455 : INFO : topic diff=0.003313, rho=0.025607\n", + "2019-01-31 01:08:36,614 : INFO : PROGRESS: pass 0, at document #3052000/4922894\n", + "2019-01-31 01:08:38,012 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:38,279 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:08:38,280 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.033*\"priest\" + 0.023*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.017*\"rotterdam\" + 0.017*\"grammat\" + 0.013*\"princ\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + "2019-01-31 01:08:38,281 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:08:38,282 : INFO : topic 
#5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:38,283 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.007*\"théori\" + 0.007*\"exampl\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.005*\"servitud\" + 0.005*\"differ\"\n", + "2019-01-31 01:08:38,289 : INFO : topic diff=0.003767, rho=0.025599\n", + "2019-01-31 01:08:38,453 : INFO : PROGRESS: pass 0, at document #3054000/4922894\n", + "2019-01-31 01:08:39,833 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:40,102 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"czech\"\n", + "2019-01-31 01:08:40,103 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"ancestor\" + 0.007*\"known\"\n", + "2019-01-31 01:08:40,104 : INFO : topic #20 (0.020): 0.150*\"scholar\" + 0.039*\"struggl\" + 0.038*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"task\" + 0.010*\"class\"\n", + "2019-01-31 01:08:40,105 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"women\"\n", + "2019-01-31 01:08:40,106 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"feel\" + 0.009*\"male\" + 0.009*\"median\" + 0.009*\"biom\" + 0.008*\"western\" + 0.008*\"incom\"\n", + "2019-01-31 01:08:40,112 : INFO : 
topic diff=0.003038, rho=0.025591\n", + "2019-01-31 01:08:40,268 : INFO : PROGRESS: pass 0, at document #3056000/4922894\n", + "2019-01-31 01:08:41,640 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:41,906 : INFO : topic #30 (0.020): 0.037*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:08:41,907 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:41,908 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"women\"\n", + "2019-01-31 01:08:41,909 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:08:41,910 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:08:41,916 : INFO : topic diff=0.004023, rho=0.025582\n", + "2019-01-31 01:08:42,071 : INFO : PROGRESS: pass 0, at document #3058000/4922894\n", + "2019-01-31 01:08:43,431 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:08:43,697 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.018*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"orchestr\" + 0.015*\"damn\" + 
0.012*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 01:08:43,698 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.012*\"aza\" + 0.009*\"battalion\" + 0.009*\"teufel\" + 0.009*\"forc\" + 0.007*\"till\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:08:43,700 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:08:43,701 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.006*\"summerhil\" + 0.006*\"woman\"\n", + "2019-01-31 01:08:43,702 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"requir\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:08:43,707 : INFO : topic diff=0.003612, rho=0.025574\n", + "2019-01-31 01:08:46,497 : INFO : -12.020 per-word bound, 4154.6 perplexity estimate based on a held-out corpus of 2000 documents with 579488 words\n", + "2019-01-31 01:08:46,497 : INFO : PROGRESS: pass 0, at document #3060000/4922894\n", + "2019-01-31 01:08:47,921 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:48,187 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"orchestr\" + 0.014*\"damn\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:08:48,188 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.028*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:08:48,189 : 
INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"requir\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:08:48,190 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.030*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 01:08:48,191 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"modern\"\n", + "2019-01-31 01:08:48,197 : INFO : topic diff=0.003568, rho=0.025565\n", + "2019-01-31 01:08:48,352 : INFO : PROGRESS: pass 0, at document #3062000/4922894\n", + "2019-01-31 01:08:49,732 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:49,997 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.030*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"martin\" + 0.013*\"women\"\n", + "2019-01-31 01:08:49,998 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:08:50,000 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.010*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"encyclopedia\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:08:50,001 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.033*\"priest\" + 0.022*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.017*\"rotterdam\" + 0.013*\"princ\" + 0.013*\"brazil\" + 0.013*\"count\"\n", + "2019-01-31 
01:08:50,001 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.027*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:08:50,007 : INFO : topic diff=0.003337, rho=0.025557\n", + "2019-01-31 01:08:50,166 : INFO : PROGRESS: pass 0, at document #3064000/4922894\n", + "2019-01-31 01:08:51,568 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:51,834 : INFO : topic #49 (0.020): 0.046*\"india\" + 0.029*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.011*\"alam\" + 0.011*\"affection\" + 0.011*\"televis\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:08:51,835 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.005*\"utopian\" + 0.005*\"differ\" + 0.005*\"servitud\"\n", + "2019-01-31 01:08:51,836 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.015*\"strategist\" + 0.014*\"center\" + 0.013*\"open\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:08:51,837 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:08:51,838 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:08:51,844 : INFO : topic diff=0.004235, rho=0.025549\n", + "2019-01-31 01:08:52,004 : INFO : PROGRESS: pass 0, at document #3066000/4922894\n", + "2019-01-31 01:08:53,405 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
01:08:53,675 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:08:53,676 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:53,677 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.030*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 01:08:53,678 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:08:53,679 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:08:53,685 : INFO : topic diff=0.004608, rho=0.025540\n", + "2019-01-31 01:08:53,837 : INFO : PROGRESS: pass 0, at document #3068000/4922894\n", + "2019-01-31 01:08:55,188 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:55,454 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"requir\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:08:55,455 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.010*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"encyclopedia\" + 
0.006*\"spectacl\"\n", + "2019-01-31 01:08:55,456 : INFO : topic #2 (0.020): 0.053*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:08:55,457 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"vacant\" + 0.008*\"lobe\"\n", + "2019-01-31 01:08:55,458 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"modern\"\n", + "2019-01-31 01:08:55,464 : INFO : topic diff=0.004271, rho=0.025532\n", + "2019-01-31 01:08:55,678 : INFO : PROGRESS: pass 0, at document #3070000/4922894\n", + "2019-01-31 01:08:57,087 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:08:57,354 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.030*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"martin\" + 0.013*\"women\"\n", + "2019-01-31 01:08:57,355 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.013*\"seaport\"\n", + "2019-01-31 01:08:57,356 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"octob\" + 0.075*\"sens\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.069*\"juli\" + 0.067*\"august\" + 0.066*\"decatur\" + 0.066*\"judici\" + 0.066*\"april\"\n", + "2019-01-31 01:08:57,357 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"théori\" + 0.006*\"exampl\" + 
0.006*\"southern\" + 0.006*\"utopian\" + 0.005*\"differ\" + 0.005*\"measur\"\n", + "2019-01-31 01:08:57,358 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.035*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:08:57,363 : INFO : topic diff=0.003679, rho=0.025524\n", + "2019-01-31 01:08:57,518 : INFO : PROGRESS: pass 0, at document #3072000/4922894\n", + "2019-01-31 01:08:58,891 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:08:59,158 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:08:59,159 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.077*\"octob\" + 0.075*\"sens\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.066*\"decatur\" + 0.066*\"august\" + 0.065*\"april\" + 0.065*\"judici\"\n", + "2019-01-31 01:08:59,161 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:08:59,162 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.010*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.008*\"human\" + 0.007*\"woman\" + 0.006*\"workplac\"\n", + "2019-01-31 01:08:59,163 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:08:59,168 : INFO : topic diff=0.004168, rho=0.025516\n", + "2019-01-31 01:08:59,324 : INFO : PROGRESS: pass 0, at document #3074000/4922894\n", + "2019-01-31 
01:09:00,713 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:00,979 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:09:00,980 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.047*\"american\" + 0.031*\"valour\" + 0.020*\"dutch\" + 0.019*\"folei\" + 0.019*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.013*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:09:00,981 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"western\" + 0.009*\"median\" + 0.008*\"male\" + 0.008*\"feel\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:09:00,982 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.077*\"octob\" + 0.075*\"sens\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.066*\"decatur\" + 0.066*\"august\" + 0.066*\"april\" + 0.065*\"judici\"\n", + "2019-01-31 01:09:00,983 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.035*\"sovereignti\" + 0.035*\"rural\" + 0.027*\"personifi\" + 0.024*\"reprint\" + 0.023*\"poison\" + 0.021*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:09:00,989 : INFO : topic diff=0.004360, rho=0.025507\n", + "2019-01-31 01:09:01,151 : INFO : PROGRESS: pass 0, at document #3076000/4922894\n", + "2019-01-31 01:09:02,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:02,802 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:09:02,803 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 
0.009*\"mexican–american\" + 0.009*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:09:02,804 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.019*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.014*\"new\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:09:02,805 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.023*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.018*\"rotterdam\" + 0.013*\"princ\" + 0.013*\"count\" + 0.012*\"brazil\"\n", + "2019-01-31 01:09:02,806 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"western\" + 0.009*\"feel\" + 0.009*\"median\" + 0.008*\"male\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:09:02,812 : INFO : topic diff=0.003791, rho=0.025499\n", + "2019-01-31 01:09:02,968 : INFO : PROGRESS: pass 0, at document #3078000/4922894\n", + "2019-01-31 01:09:04,344 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:04,611 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.018*\"buford\" + 0.017*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"depress\" + 0.011*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:09:04,612 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.013*\"proclaim\" + 0.013*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:09:04,613 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:09:04,614 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 
0.022*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:09:04,615 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"swedish\" + 0.016*\"stop\" + 0.016*\"norwai\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.012*\"treeless\" + 0.012*\"damag\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:09:04,621 : INFO : topic diff=0.003783, rho=0.025491\n", + "2019-01-31 01:09:07,312 : INFO : -11.967 per-word bound, 4003.4 perplexity estimate based on a held-out corpus of 2000 documents with 561897 words\n", + "2019-01-31 01:09:07,312 : INFO : PROGRESS: pass 0, at document #3080000/4922894\n", + "2019-01-31 01:09:08,685 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:08,951 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.016*\"italian\" + 0.016*\"mexico\" + 0.012*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"itali\" + 0.010*\"francisco\"\n", + "2019-01-31 01:09:08,952 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"seaport\"\n", + "2019-01-31 01:09:08,953 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:09:08,954 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"new\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:09:08,955 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 
0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:09:08,961 : INFO : topic diff=0.004487, rho=0.025482\n", + "2019-01-31 01:09:09,115 : INFO : PROGRESS: pass 0, at document #3082000/4922894\n", + "2019-01-31 01:09:10,473 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:09:10,740 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:09:10,741 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.005*\"differ\" + 0.005*\"method\"\n", + "2019-01-31 01:09:10,742 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.030*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.014*\"martin\" + 0.013*\"winner\"\n", + "2019-01-31 01:09:10,743 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.012*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:09:10,744 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"vacant\"\n", + "2019-01-31 01:09:10,750 : INFO : topic diff=0.004358, rho=0.025474\n", + "2019-01-31 01:09:10,905 : INFO : PROGRESS: pass 0, at document #3084000/4922894\n", + "2019-01-31 01:09:12,282 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:12,549 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 
0.025*\"rosenwald\" + 0.021*\"traceabl\" + 0.020*\"serv\" + 0.015*\"museo\" + 0.014*\"oper\" + 0.010*\"radiu\" + 0.010*\"brook\"\n", + "2019-01-31 01:09:12,550 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"anim\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"love\" + 0.006*\"dixi\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:09:12,551 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:09:12,552 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:09:12,553 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.027*\"word\" + 0.018*\"new\" + 0.015*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.010*\"author\" + 0.010*\"worldwid\"\n", + "2019-01-31 01:09:12,559 : INFO : topic diff=0.004597, rho=0.025466\n", + "2019-01-31 01:09:12,717 : INFO : PROGRESS: pass 0, at document #3086000/4922894\n", + "2019-01-31 01:09:14,105 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:14,371 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:09:14,372 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.017*\"alic\"\n", + "2019-01-31 01:09:14,373 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 
0.016*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"francisco\" + 0.010*\"itali\"\n", + "2019-01-31 01:09:14,374 : INFO : topic #49 (0.020): 0.046*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.011*\"alam\" + 0.011*\"affection\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:09:14,375 : INFO : topic #29 (0.020): 0.029*\"companhia\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:09:14,380 : INFO : topic diff=0.003159, rho=0.025458\n", + "2019-01-31 01:09:14,539 : INFO : PROGRESS: pass 0, at document #3088000/4922894\n", + "2019-01-31 01:09:15,937 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:16,203 : INFO : topic #20 (0.020): 0.150*\"scholar\" + 0.039*\"struggl\" + 0.037*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"class\" + 0.009*\"gothic\"\n", + "2019-01-31 01:09:16,205 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\" + 0.007*\"championship\" + 0.007*\"softwar\"\n", + "2019-01-31 01:09:16,205 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:09:16,206 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.018*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"depress\" + 0.011*\"linear\" + 0.010*\"strategist\"\n", + "2019-01-31 01:09:16,207 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 
0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:09:16,213 : INFO : topic diff=0.004542, rho=0.025449\n", + "2019-01-31 01:09:16,374 : INFO : PROGRESS: pass 0, at document #3090000/4922894\n", + "2019-01-31 01:09:17,741 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:18,010 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:09:18,011 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.006*\"southern\" + 0.005*\"differ\"\n", + "2019-01-31 01:09:18,012 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:09:18,013 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.026*\"hous\" + 0.018*\"rivièr\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:09:18,014 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:18,020 : INFO : topic diff=0.004041, rho=0.025441\n", + "2019-01-31 01:09:18,173 : INFO : PROGRESS: pass 0, at document #3092000/4922894\n", + "2019-01-31 01:09:19,535 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:19,801 : INFO : topic #16 (0.020): 0.057*\"king\" + 
0.032*\"priest\" + 0.021*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"grammat\" + 0.018*\"quarterli\" + 0.018*\"rotterdam\" + 0.013*\"count\" + 0.012*\"princ\" + 0.012*\"brazil\"\n", + "2019-01-31 01:09:19,802 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.022*\"poison\" + 0.021*\"moscow\" + 0.016*\"unfortun\" + 0.016*\"poland\" + 0.014*\"czech\"\n", + "2019-01-31 01:09:19,804 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.047*\"franc\" + 0.034*\"pari\" + 0.027*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:09:19,805 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.007*\"théori\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.005*\"southern\" + 0.005*\"differ\"\n", + "2019-01-31 01:09:19,806 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:09:19,812 : INFO : topic diff=0.003703, rho=0.025433\n", + "2019-01-31 01:09:19,965 : INFO : PROGRESS: pass 0, at document #3094000/4922894\n", + "2019-01-31 01:09:21,325 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:21,592 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"selma\" + 0.014*\"bypass\" + 0.013*\"seaport\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:09:21,593 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.048*\"american\" + 0.030*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"simpler\" + 0.012*\"acrimoni\"\n", 
+ "2019-01-31 01:09:21,594 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:09:21,595 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"pain\" + 0.017*\"colder\" + 0.014*\"black\" + 0.013*\"western\" + 0.011*\"arsen\" + 0.011*\"record\" + 0.010*\"depress\"\n", + "2019-01-31 01:09:21,596 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:09:21,602 : INFO : topic diff=0.003716, rho=0.025425\n", + "2019-01-31 01:09:21,758 : INFO : PROGRESS: pass 0, at document #3096000/4922894\n", + "2019-01-31 01:09:23,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:23,410 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.048*\"american\" + 0.030*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.019*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:09:23,411 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.046*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:09:23,412 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"median\" + 0.009*\"western\" + 0.009*\"feel\" + 0.009*\"male\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:09:23,413 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:09:23,414 : INFO : topic 
#26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"alic\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:09:23,419 : INFO : topic diff=0.003893, rho=0.025416\n", + "2019-01-31 01:09:23,581 : INFO : PROGRESS: pass 0, at document #3098000/4922894\n", + "2019-01-31 01:09:24,993 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:25,259 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:09:25,261 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"pain\" + 0.016*\"colder\" + 0.014*\"black\" + 0.013*\"western\" + 0.011*\"arsen\" + 0.011*\"record\" + 0.010*\"depress\"\n", + "2019-01-31 01:09:25,261 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:09:25,262 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:25,263 : INFO : topic #17 (0.020): 0.081*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.009*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:09:25,269 : INFO : topic diff=0.004811, rho=0.025408\n", + "2019-01-31 01:09:27,896 : INFO : -11.690 per-word bound, 3303.2 perplexity estimate based on a held-out corpus of 2000 documents with 515509 words\n", + "2019-01-31 01:09:27,896 : INFO : PROGRESS: pass 0, at 
document #3100000/4922894\n", + "2019-01-31 01:09:29,246 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:29,512 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"median\" + 0.009*\"western\" + 0.009*\"male\" + 0.008*\"biom\" + 0.008*\"feel\" + 0.008*\"incom\"\n", + "2019-01-31 01:09:29,514 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:29,515 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"govern\" + 0.007*\"militari\"\n", + "2019-01-31 01:09:29,516 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.012*\"bank\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:09:29,517 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:09:29,523 : INFO : topic diff=0.003987, rho=0.025400\n", + "2019-01-31 01:09:29,736 : INFO : PROGRESS: pass 0, at document #3102000/4922894\n", + "2019-01-31 01:09:31,145 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:31,415 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:09:31,416 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 
0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:09:31,417 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.009*\"poll\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:09:31,418 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.047*\"franc\" + 0.034*\"pari\" + 0.026*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:09:31,419 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:09:31,425 : INFO : topic diff=0.003505, rho=0.025392\n", + "2019-01-31 01:09:31,587 : INFO : PROGRESS: pass 0, at document #3104000/4922894\n", + "2019-01-31 01:09:33,012 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:33,279 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:09:33,280 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:09:33,281 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.032*\"priest\" + 0.021*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.018*\"rotterdam\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.012*\"princ\"\n", + "2019-01-31 01:09:33,282 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.017*\"swedish\" + 0.017*\"norwai\" + 
0.016*\"stop\" + 0.015*\"norwegian\" + 0.013*\"wind\" + 0.012*\"damag\" + 0.012*\"turkish\" + 0.012*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:09:33,283 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.017*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"foam\"\n", + "2019-01-31 01:09:33,289 : INFO : topic diff=0.003661, rho=0.025384\n", + "2019-01-31 01:09:33,447 : INFO : PROGRESS: pass 0, at document #3106000/4922894\n", + "2019-01-31 01:09:34,830 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:35,096 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:09:35,097 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"selma\" + 0.014*\"bypass\" + 0.013*\"seaport\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:09:35,098 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:09:35,099 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:09:35,100 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:09:35,106 : INFO : topic diff=0.004011, 
rho=0.025375\n", + "2019-01-31 01:09:35,261 : INFO : PROGRESS: pass 0, at document #3108000/4922894\n", + "2019-01-31 01:09:36,631 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:36,897 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"love\" + 0.006*\"vision\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:09:36,898 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:09:36,899 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"new\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:09:36,900 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.009*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"encyclopedia\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:09:36,901 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.015*\"norwegian\" + 0.013*\"damag\" + 0.013*\"wind\" + 0.012*\"turkish\" + 0.012*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:09:36,907 : INFO : topic diff=0.003738, rho=0.025367\n", + "2019-01-31 01:09:37,068 : INFO : PROGRESS: pass 0, at document #3110000/4922894\n", + "2019-01-31 01:09:38,541 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:38,808 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.071*\"januari\" + 0.070*\"juli\" + 0.069*\"notion\" + 0.068*\"august\" + 0.067*\"decatur\" + 0.066*\"april\" + 0.066*\"judici\"\n", + "2019-01-31 01:09:38,810 
: INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:09:38,811 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:09:38,812 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:09:38,813 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:09:38,819 : INFO : topic diff=0.003766, rho=0.025359\n", + "2019-01-31 01:09:38,974 : INFO : PROGRESS: pass 0, at document #3112000/4922894\n", + "2019-01-31 01:09:40,333 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:40,598 : INFO : topic #17 (0.020): 0.081*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\" + 0.009*\"parish\"\n", + "2019-01-31 01:09:40,599 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.016*\"quebec\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 01:09:40,600 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"alam\" + 0.010*\"affection\" + 0.010*\"khalsa\"\n", + 
"2019-01-31 01:09:40,601 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"male\" + 0.009*\"median\" + 0.008*\"western\" + 0.008*\"feel\" + 0.008*\"biom\" + 0.008*\"incom\"\n", + "2019-01-31 01:09:40,602 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.026*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:09:40,608 : INFO : topic diff=0.004149, rho=0.025351\n", + "2019-01-31 01:09:40,767 : INFO : PROGRESS: pass 0, at document #3114000/4922894\n", + "2019-01-31 01:09:42,143 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:42,409 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.025*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:09:42,410 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:09:42,411 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:42,412 : INFO : topic #20 (0.020): 0.149*\"scholar\" + 0.040*\"struggl\" + 0.036*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:09:42,413 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.017*\"alic\"\n", + "2019-01-31 01:09:42,419 : INFO 
: topic diff=0.004726, rho=0.025343\n", + "2019-01-31 01:09:42,578 : INFO : PROGRESS: pass 0, at document #3116000/4922894\n", + "2019-01-31 01:09:43,971 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:44,238 : INFO : topic #20 (0.020): 0.149*\"scholar\" + 0.040*\"struggl\" + 0.036*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:09:44,239 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"vision\" + 0.006*\"love\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:09:44,240 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.071*\"best\" + 0.037*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:09:44,241 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.009*\"male\" + 0.008*\"median\" + 0.008*\"western\" + 0.008*\"feel\" + 0.008*\"incom\"\n", + "2019-01-31 01:09:44,242 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:09:44,248 : INFO : topic diff=0.003409, rho=0.025335\n", + "2019-01-31 01:09:44,407 : INFO : PROGRESS: pass 0, at document #3118000/4922894\n", + "2019-01-31 01:09:45,776 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:46,042 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.016*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.010*\"magazin\" + 0.010*\"author\"\n", + "2019-01-31 01:09:46,044 : INFO : 
topic #27 (0.020): 0.073*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"ret\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"champion\"\n", + "2019-01-31 01:09:46,045 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"stop\" + 0.017*\"swedish\" + 0.017*\"norwai\" + 0.016*\"norwegian\" + 0.013*\"wind\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.011*\"turkish\" + 0.011*\"huntsvil\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:09:46,046 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.008*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:09:46,047 : INFO : topic #6 (0.020): 0.072*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:09:46,053 : INFO : topic diff=0.003315, rho=0.025327\n", + "2019-01-31 01:09:48,690 : INFO : -11.655 per-word bound, 3225.1 perplexity estimate based on a held-out corpus of 2000 documents with 526146 words\n", + "2019-01-31 01:09:48,690 : INFO : PROGRESS: pass 0, at document #3120000/4922894\n", + "2019-01-31 01:09:50,043 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:50,312 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:09:50,313 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"workplac\" + 0.006*\"vision\" + 0.006*\"love\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:09:50,314 : INFO : topic #1 (0.020): 
0.052*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:09:50,315 : INFO : topic #20 (0.020): 0.148*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:09:50,316 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:09:50,322 : INFO : topic diff=0.003679, rho=0.025318\n", + "2019-01-31 01:09:50,480 : INFO : PROGRESS: pass 0, at document #3122000/4922894\n", + "2019-01-31 01:09:51,858 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:52,124 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:09:52,125 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:09:52,126 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:52,127 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.018*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:09:52,128 : INFO : topic #24 (0.020): 
0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.016*\"arsen\" + 0.013*\"presid\" + 0.013*\"edit\" + 0.011*\"collect\" + 0.010*\"magazin\" + 0.010*\"author\"\n", + "2019-01-31 01:09:52,135 : INFO : topic diff=0.003936, rho=0.025310\n", + "2019-01-31 01:09:52,295 : INFO : PROGRESS: pass 0, at document #3124000/4922894\n", + "2019-01-31 01:09:53,696 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:53,963 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"traceabl\" + 0.020*\"serv\" + 0.014*\"oper\" + 0.012*\"museo\" + 0.010*\"radiu\" + 0.010*\"transient\"\n", + "2019-01-31 01:09:53,964 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:09:53,965 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.018*\"rivièr\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:09:53,966 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:53,967 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:09:53,973 : INFO : topic diff=0.004002, rho=0.025302\n", + "2019-01-31 01:09:54,133 : INFO : PROGRESS: pass 0, at document #3126000/4922894\n", + "2019-01-31 01:09:55,512 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:55,778 : 
INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"australia\" + 0.026*\"new\" + 0.026*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:09:55,779 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.016*\"hydrogen\" + 0.016*\"quebec\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"novotná\"\n", + "2019-01-31 01:09:55,780 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"stop\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"norwegian\" + 0.013*\"wind\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.012*\"turkish\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:09:55,781 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"alic\"\n", + "2019-01-31 01:09:55,783 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:09:55,788 : INFO : topic diff=0.003506, rho=0.025294\n", + "2019-01-31 01:09:55,942 : INFO : PROGRESS: pass 0, at document #3128000/4922894\n", + "2019-01-31 01:09:57,298 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:57,565 : INFO : topic #16 (0.020): 0.060*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.013*\"count\" + 0.013*\"brazil\" + 0.012*\"princ\"\n", + "2019-01-31 01:09:57,565 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.046*\"american\" + 0.032*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 
01:09:57,567 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"kill\" + 0.006*\"dai\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:09:57,568 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.018*\"rivièr\" + 0.014*\"histor\" + 0.012*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:09:57,569 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"traceabl\" + 0.020*\"serv\" + 0.014*\"oper\" + 0.012*\"museo\" + 0.011*\"brook\" + 0.011*\"transient\"\n", + "2019-01-31 01:09:57,575 : INFO : topic diff=0.003521, rho=0.025286\n", + "2019-01-31 01:09:57,732 : INFO : PROGRESS: pass 0, at document #3130000/4922894\n", + "2019-01-31 01:09:59,104 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:09:59,372 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:09:59,373 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.007*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:09:59,374 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:09:59,375 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 
0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:09:59,376 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"traceabl\" + 0.020*\"serv\" + 0.014*\"oper\" + 0.012*\"museo\" + 0.011*\"brook\" + 0.011*\"transient\"\n", + "2019-01-31 01:09:59,382 : INFO : topic diff=0.003754, rho=0.025278\n", + "2019-01-31 01:09:59,539 : INFO : PROGRESS: pass 0, at document #3132000/4922894\n", + "2019-01-31 01:10:00,914 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:01,181 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:10:01,182 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.026*\"hous\" + 0.018*\"buford\" + 0.017*\"rivièr\" + 0.013*\"histor\" + 0.011*\"briarwood\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:10:01,183 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:10:01,184 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:10:01,185 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.046*\"american\" + 0.032*\"valour\" + 0.020*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:10:01,191 : INFO : topic diff=0.003819, rho=0.025270\n", + "2019-01-31 01:10:01,351 : INFO : PROGRESS: pass 0, at document #3134000/4922894\n", + "2019-01-31 01:10:02,747 : INFO 
: merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:03,013 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.016*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.010*\"author\" + 0.010*\"magazin\"\n", + "2019-01-31 01:10:03,014 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:10:03,015 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:10:03,016 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:10:03,017 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.013*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:10:03,023 : INFO : topic diff=0.003940, rho=0.025262\n", + "2019-01-31 01:10:03,242 : INFO : PROGRESS: pass 0, at document #3136000/4922894\n", + "2019-01-31 01:10:04,637 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:04,903 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:10:04,905 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 
0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:10:04,906 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:10:04,907 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"sri\"\n", + "2019-01-31 01:10:04,908 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:04,913 : INFO : topic diff=0.003994, rho=0.025254\n", + "2019-01-31 01:10:05,071 : INFO : PROGRESS: pass 0, at document #3138000/4922894\n", + "2019-01-31 01:10:06,456 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:06,722 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 01:10:06,723 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.043*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:10:06,724 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"cathol\" + 0.024*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:10:06,725 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.033*\"priest\" + 0.019*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.019*\"grammat\" + 
0.018*\"idiosyncrat\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.013*\"brazil\"\n", + "2019-01-31 01:10:06,726 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.012*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:06,732 : INFO : topic diff=0.004529, rho=0.025246\n", + "2019-01-31 01:10:09,457 : INFO : -11.574 per-word bound, 3048.9 perplexity estimate based on a held-out corpus of 2000 documents with 568793 words\n", + "2019-01-31 01:10:09,457 : INFO : PROGRESS: pass 0, at document #3140000/4922894\n", + "2019-01-31 01:10:10,844 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:11,111 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"biom\" + 0.009*\"western\" + 0.008*\"male\" + 0.008*\"median\" + 0.008*\"feel\" + 0.007*\"incom\"\n", + "2019-01-31 01:10:11,112 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:10:11,113 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:10:11,114 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:10:11,115 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"australia\" + 0.026*\"new\" + 0.026*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 
01:10:11,120 : INFO : topic diff=0.003668, rho=0.025238\n", + "2019-01-31 01:10:11,282 : INFO : PROGRESS: pass 0, at document #3142000/4922894\n", + "2019-01-31 01:10:12,685 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:12,952 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:10:12,953 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:10:12,954 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.010*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"class\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:10:12,955 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"pain\" + 0.016*\"colder\" + 0.013*\"black\" + 0.013*\"western\" + 0.012*\"arsen\" + 0.011*\"depress\" + 0.010*\"record\"\n", + "2019-01-31 01:10:12,956 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.024*\"cathol\" + 0.024*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:10:12,962 : INFO : topic diff=0.004457, rho=0.025230\n", + "2019-01-31 01:10:13,120 : INFO : PROGRESS: pass 0, at document #3144000/4922894\n", + "2019-01-31 01:10:14,513 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:14,779 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 
0.012*\"faster\" + 0.012*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:10:14,780 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:10:14,781 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"nation\"\n", + "2019-01-31 01:10:14,782 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.033*\"priest\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.013*\"brazil\"\n", + "2019-01-31 01:10:14,783 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.044*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:10:14,789 : INFO : topic diff=0.003676, rho=0.025222\n", + "2019-01-31 01:10:14,942 : INFO : PROGRESS: pass 0, at document #3146000/4922894\n", + "2019-01-31 01:10:16,295 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:16,562 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:16,563 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"théori\" + 0.007*\"utopian\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"differ\" + 0.006*\"southern\"\n", + "2019-01-31 01:10:16,564 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 
0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 01:10:16,565 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:10:16,566 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"gastrointestin\"\n", + "2019-01-31 01:10:16,572 : INFO : topic diff=0.004447, rho=0.025214\n", + "2019-01-31 01:10:16,726 : INFO : PROGRESS: pass 0, at document #3148000/4922894\n", + "2019-01-31 01:10:18,107 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:18,374 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:10:18,375 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:10:18,376 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:10:18,377 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.072*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.012*\"winner\"\n", + "2019-01-31 01:10:18,378 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 
0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:18,384 : INFO : topic diff=0.003971, rho=0.025206\n", + "2019-01-31 01:10:18,542 : INFO : PROGRESS: pass 0, at document #3150000/4922894\n", + "2019-01-31 01:10:19,924 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:20,191 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.024*\"cathol\" + 0.024*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:10:20,192 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.013*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"mexican–american\" + 0.010*\"rival\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:10:20,193 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:10:20,194 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.008*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"vision\" + 0.006*\"storag\" + 0.006*\"love\"\n", + "2019-01-31 01:10:20,196 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:20,202 : INFO : topic diff=0.003900, rho=0.025198\n", + "2019-01-31 01:10:20,361 : INFO : PROGRESS: pass 0, at document #3152000/4922894\n", + "2019-01-31 01:10:21,759 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:22,027 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 
0.018*\"daphn\" + 0.014*\"loui\" + 0.014*\"lazi\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:10:22,028 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:10:22,029 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:22,030 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.024*\"fifteenth\" + 0.018*\"illicit\" + 0.017*\"pain\" + 0.016*\"colder\" + 0.013*\"black\" + 0.013*\"western\" + 0.013*\"arsen\" + 0.011*\"depress\" + 0.010*\"gai\"\n", + "2019-01-31 01:10:22,032 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 01:10:22,038 : INFO : topic diff=0.004152, rho=0.025190\n", + "2019-01-31 01:10:22,197 : INFO : PROGRESS: pass 0, at document #3154000/4922894\n", + "2019-01-31 01:10:23,571 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:23,837 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:10:23,838 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:10:23,840 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.023*\"multitud\" + 0.022*\"area\" 
+ 0.021*\"adulthood\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:10:23,841 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:10:23,842 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:10:23,848 : INFO : topic diff=0.004476, rho=0.025182\n", + "2019-01-31 01:10:24,009 : INFO : PROGRESS: pass 0, at document #3156000/4922894\n", + "2019-01-31 01:10:25,431 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:25,697 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:10:25,699 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"palmer\" + 0.008*\"sourc\" + 0.008*\"lobe\"\n", + "2019-01-31 01:10:25,700 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"juan\" + 0.011*\"josé\" + 0.011*\"carlo\" + 0.011*\"santa\"\n", + "2019-01-31 01:10:25,701 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:10:25,702 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" 
+ 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:10:25,708 : INFO : topic diff=0.005016, rho=0.025174\n", + "2019-01-31 01:10:25,865 : INFO : PROGRESS: pass 0, at document #3158000/4922894\n", + "2019-01-31 01:10:27,250 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:27,516 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"juan\" + 0.011*\"josé\" + 0.011*\"carlo\" + 0.011*\"santa\"\n", + "2019-01-31 01:10:27,517 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:10:27,519 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.039*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.022*\"poison\" + 0.019*\"moscow\" + 0.015*\"poland\" + 0.015*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 01:10:27,520 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.046*\"american\" + 0.031*\"valour\" + 0.020*\"folei\" + 0.018*\"player\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:10:27,521 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.029*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 01:10:27,527 : INFO : topic diff=0.003629, rho=0.025166\n", + "2019-01-31 01:10:30,341 : INFO : -11.976 per-word bound, 4028.9 perplexity estimate based on a held-out corpus of 2000 documents with 608637 words\n", + "2019-01-31 01:10:30,342 : INFO : PROGRESS: pass 0, at document #3160000/4922894\n", + "2019-01-31 01:10:31,774 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:32,040 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"new\" + 0.014*\"quebec\" + 0.014*\"misericordia\" + 0.013*\"novotná\"\n", + "2019-01-31 01:10:32,041 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:10:32,043 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"biom\" + 0.009*\"western\" + 0.008*\"male\" + 0.008*\"feel\" + 0.008*\"median\" + 0.007*\"trap\"\n", + "2019-01-31 01:10:32,044 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.045*\"american\" + 0.031*\"valour\" + 0.020*\"folei\" + 0.018*\"player\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:10:32,045 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"spectacl\" + 0.006*\"encyclopedia\" + 0.006*\"produc\"\n", + "2019-01-31 01:10:32,051 : INFO : topic diff=0.003941, rho=0.025158\n", + "2019-01-31 01:10:32,214 : INFO : PROGRESS: pass 0, at document #3162000/4922894\n", + "2019-01-31 01:10:33,629 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:33,897 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"storag\" + 0.006*\"vision\" + 0.006*\"fusiform\"\n", + "2019-01-31 01:10:33,898 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.080*\"sens\" + 0.078*\"octob\" + 0.072*\"januari\" + 0.071*\"august\" + 0.070*\"juli\" + 
0.069*\"notion\" + 0.068*\"judici\" + 0.067*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 01:10:33,899 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:10:33,900 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:10:33,901 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.007*\"utopian\" + 0.006*\"gener\" + 0.006*\"théori\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.005*\"differ\"\n", + "2019-01-31 01:10:33,908 : INFO : topic diff=0.004350, rho=0.025150\n", + "2019-01-31 01:10:34,070 : INFO : PROGRESS: pass 0, at document #3164000/4922894\n", + "2019-01-31 01:10:35,955 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:36,221 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.080*\"sens\" + 0.078*\"octob\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.071*\"august\" + 0.069*\"notion\" + 0.068*\"judici\" + 0.067*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 01:10:36,222 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:10:36,223 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:10:36,224 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 
0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:10:36,225 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"gastrointestin\"\n", + "2019-01-31 01:10:36,231 : INFO : topic diff=0.004311, rho=0.025142\n", + "2019-01-31 01:10:36,453 : INFO : PROGRESS: pass 0, at document #3166000/4922894\n", + "2019-01-31 01:10:37,845 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:38,115 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 01:10:38,115 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.022*\"poison\" + 0.019*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 01:10:38,117 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:10:38,118 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"seaport\" + 0.013*\"bypass\" + 0.013*\"selma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:10:38,119 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:10:38,125 : INFO : topic diff=0.004365, rho=0.025134\n", + "2019-01-31 
01:10:38,282 : INFO : PROGRESS: pass 0, at document #3168000/4922894\n", + "2019-01-31 01:10:39,682 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:39,948 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:10:39,949 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:10:39,950 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.022*\"poison\" + 0.019*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:10:39,951 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:10:39,952 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:10:39,958 : INFO : topic diff=0.003928, rho=0.025126\n", + "2019-01-31 01:10:40,116 : INFO : PROGRESS: pass 0, at document #3170000/4922894\n", + "2019-01-31 01:10:41,507 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:41,774 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"feel\" + 0.008*\"male\" + 0.007*\"trap\"\n", + "2019-01-31 01:10:41,775 : INFO : topic #40 (0.020): 0.087*\"unit\" + 
0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:10:41,776 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.024*\"fifteenth\" + 0.019*\"illicit\" + 0.017*\"pain\" + 0.016*\"colder\" + 0.014*\"arsen\" + 0.013*\"black\" + 0.012*\"western\" + 0.011*\"depress\" + 0.011*\"gai\"\n", + "2019-01-31 01:10:41,777 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.007*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:10:41,778 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.057*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"seaport\" + 0.013*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:10:41,784 : INFO : topic diff=0.003314, rho=0.025118\n", + "2019-01-31 01:10:41,938 : INFO : PROGRESS: pass 0, at document #3172000/4922894\n", + "2019-01-31 01:10:43,304 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:43,571 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.010*\"josé\"\n", + "2019-01-31 01:10:43,572 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:10:43,573 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:10:43,574 : INFO : topic #39 (0.020): 0.058*\"canada\" + 
0.044*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:10:43,575 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.027*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:10:43,580 : INFO : topic diff=0.004106, rho=0.025110\n", + "2019-01-31 01:10:43,738 : INFO : PROGRESS: pass 0, at document #3174000/4922894\n", + "2019-01-31 01:10:45,139 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:45,405 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:10:45,406 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:10:45,407 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:10:45,408 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:10:45,409 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.023*\"cathol\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:10:45,415 : INFO : topic 
diff=0.003677, rho=0.025102\n", + "2019-01-31 01:10:45,575 : INFO : PROGRESS: pass 0, at document #3176000/4922894\n", + "2019-01-31 01:10:46,947 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:47,214 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.057*\"parti\" + 0.025*\"democrat\" + 0.024*\"voluntari\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.013*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:10:47,215 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.029*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.013*\"winner\"\n", + "2019-01-31 01:10:47,216 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:10:47,217 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:10:47,218 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:10:47,224 : INFO : topic diff=0.003521, rho=0.025094\n", + "2019-01-31 01:10:47,383 : INFO : PROGRESS: pass 0, at document #3178000/4922894\n", + "2019-01-31 01:10:48,790 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:49,057 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 
01:10:49,058 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:10:49,059 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:10:49,060 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.018*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"nation\"\n", + "2019-01-31 01:10:49,061 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.006*\"utopian\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"differ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:10:49,067 : INFO : topic diff=0.003511, rho=0.025086\n", + "2019-01-31 01:10:51,794 : INFO : -11.411 per-word bound, 2722.3 perplexity estimate based on a held-out corpus of 2000 documents with 573974 words\n", + "2019-01-31 01:10:51,795 : INFO : PROGRESS: pass 0, at document #3180000/4922894\n", + "2019-01-31 01:10:53,196 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:53,462 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"feel\" + 0.008*\"male\" + 0.007*\"trap\"\n", + "2019-01-31 01:10:53,463 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.020*\"bishop\" + 0.016*\"retroflex\" + 0.016*\"sail\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:10:53,464 : 
INFO : topic #2 (0.020): 0.052*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:10:53,465 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:10:53,466 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 0.027*\"rosenwald\" + 0.021*\"traceabl\" + 0.021*\"serv\" + 0.014*\"oper\" + 0.011*\"rivièr\" + 0.011*\"airmen\" + 0.011*\"transient\"\n", + "2019-01-31 01:10:53,472 : INFO : topic diff=0.004377, rho=0.025078\n", + "2019-01-31 01:10:53,625 : INFO : PROGRESS: pass 0, at document #3182000/4922894\n", + "2019-01-31 01:10:54,979 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:55,245 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:10:55,246 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:10:55,247 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.012*\"islam\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.010*\"sri\" + 0.010*\"affection\" + 0.010*\"alam\"\n", + "2019-01-31 01:10:55,248 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:10:55,250 : INFO : topic #18 
(0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:10:55,255 : INFO : topic diff=0.004012, rho=0.025071\n", + "2019-01-31 01:10:55,412 : INFO : PROGRESS: pass 0, at document #3184000/4922894\n", + "2019-01-31 01:10:56,804 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:57,070 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.017*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"depress\" + 0.011*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:10:57,072 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:10:57,073 : INFO : topic #20 (0.020): 0.148*\"scholar\" + 0.040*\"struggl\" + 0.037*\"high\" + 0.031*\"educ\" + 0.026*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"district\" + 0.009*\"gothic\"\n", + "2019-01-31 01:10:57,074 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:10:57,075 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:10:57,081 : INFO : topic diff=0.003405, rho=0.025063\n", + "2019-01-31 01:10:57,234 : INFO : PROGRESS: pass 0, at document #3186000/4922894\n", + "2019-01-31 01:10:58,600 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:10:58,867 : INFO : topic 
#36 (0.020): 0.012*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:10:58,868 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:10:58,868 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.031*\"perceptu\" + 0.019*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.014*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"jack\"\n", + "2019-01-31 01:10:58,869 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.024*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:10:58,870 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.010*\"champion\"\n", + "2019-01-31 01:10:58,876 : INFO : topic diff=0.003314, rho=0.025055\n", + "2019-01-31 01:10:59,033 : INFO : PROGRESS: pass 0, at document #3188000/4922894\n", + "2019-01-31 01:11:00,435 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:00,704 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:11:00,705 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"anim\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.006*\"workplac\" + 0.006*\"storag\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:11:00,707 : INFO : topic #40 
(0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:11:00,708 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.048*\"american\" + 0.030*\"valour\" + 0.020*\"folei\" + 0.020*\"player\" + 0.017*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:11:00,709 : INFO : topic #20 (0.020): 0.152*\"scholar\" + 0.040*\"struggl\" + 0.037*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"prickli\" + 0.010*\"task\" + 0.009*\"district\"\n", + "2019-01-31 01:11:00,714 : INFO : topic diff=0.003494, rho=0.025047\n", + "2019-01-31 01:11:00,869 : INFO : PROGRESS: pass 0, at document #3190000/4922894\n", + "2019-01-31 01:11:02,245 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:02,512 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"berlin\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:11:02,513 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:11:02,514 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.009*\"poll\" + 0.009*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:11:02,515 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.057*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.013*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:11:02,516 : INFO : topic 
#41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:11:02,522 : INFO : topic diff=0.004055, rho=0.025039\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:11:02,680 : INFO : PROGRESS: pass 0, at document #3192000/4922894\n", + "2019-01-31 01:11:04,087 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:04,355 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.012*\"faster\" + 0.012*\"life\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:11:04,356 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.013*\"treeless\" + 0.012*\"damag\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:11:04,357 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:11:04,358 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:11:04,359 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.034*\"priest\" + 0.023*\"duke\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.015*\"count\" + 0.014*\"brazil\" + 0.012*\"princ\"\n", + "2019-01-31 01:11:04,365 : INFO : topic diff=0.003654, rho=0.025031\n", + "2019-01-31 01:11:04,520 : INFO : PROGRESS: pass 0, at document #3194000/4922894\n", + "2019-01-31 01:11:05,892 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:11:06,158 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:11:06,159 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:11:06,160 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.017*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"briarwood\" + 0.010*\"linear\" + 0.010*\"silicon\"\n", + "2019-01-31 01:11:06,161 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.033*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:11:06,162 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:06,168 : INFO : topic diff=0.003691, rho=0.025023\n", + "2019-01-31 01:11:06,322 : INFO : PROGRESS: pass 0, at document #3196000/4922894\n", + "2019-01-31 01:11:07,692 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:07,958 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.071*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.020*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.012*\"winner\"\n", + "2019-01-31 01:11:07,959 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.023*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 
0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:11:07,960 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:11:07,961 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:11:07,962 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:07,968 : INFO : topic diff=0.003398, rho=0.025016\n", + "2019-01-31 01:11:08,181 : INFO : PROGRESS: pass 0, at document #3198000/4922894\n", + "2019-01-31 01:11:09,566 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:09,835 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.020*\"illicit\" + 0.017*\"pain\" + 0.015*\"colder\" + 0.014*\"arsen\" + 0.013*\"black\" + 0.012*\"western\" + 0.012*\"museo\" + 0.011*\"gai\"\n", + "2019-01-31 01:11:09,836 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.029*\"final\" + 0.021*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:11:09,837 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.037*\"tortur\" + 0.032*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:11:09,838 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 
0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:11:09,840 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:11:09,845 : INFO : topic diff=0.003829, rho=0.025008\n", + "2019-01-31 01:11:12,486 : INFO : -11.511 per-word bound, 2919.3 perplexity estimate based on a held-out corpus of 2000 documents with 515958 words\n", + "2019-01-31 01:11:12,486 : INFO : PROGRESS: pass 0, at document #3200000/4922894\n", + "2019-01-31 01:11:13,858 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:14,124 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:11:14,125 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"briarwood\" + 0.011*\"silicon\" + 0.010*\"linear\"\n", + "2019-01-31 01:11:14,127 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:11:14,128 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.042*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.019*\"ontario\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:11:14,129 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"group\" + 0.009*\"commun\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:14,134 : INFO : topic diff=0.004012, 
rho=0.025000\n", + "2019-01-31 01:11:14,297 : INFO : PROGRESS: pass 0, at document #3202000/4922894\n", + "2019-01-31 01:11:15,692 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:15,959 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"feel\" + 0.008*\"male\" + 0.008*\"trap\"\n", + "2019-01-31 01:11:15,960 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:11:15,961 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.012*\"islam\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.010*\"sri\" + 0.010*\"alam\" + 0.010*\"affection\"\n", + "2019-01-31 01:11:15,962 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:11:15,963 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.026*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"rainfal\" + 0.018*\"nation\" + 0.018*\"atheist\"\n", + "2019-01-31 01:11:15,969 : INFO : topic diff=0.003855, rho=0.024992\n", + "2019-01-31 01:11:16,124 : INFO : PROGRESS: pass 0, at document #3204000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:11:17,518 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:17,785 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.006*\"storag\" + 
0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:11:17,786 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"lagrang\" + 0.019*\"area\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.008*\"palmer\"\n", + "2019-01-31 01:11:17,787 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:11:17,788 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.012*\"anglo\" + 0.012*\"islam\" + 0.012*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 01:11:17,789 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:11:17,794 : INFO : topic diff=0.003871, rho=0.024984\n", + "2019-01-31 01:11:17,949 : INFO : PROGRESS: pass 0, at document #3206000/4922894\n", + "2019-01-31 01:11:19,319 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:19,585 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:19,586 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.023*\"medal\" + 0.021*\"event\" + 0.018*\"rainfal\" + 0.018*\"nation\" + 0.018*\"atheist\"\n", + "2019-01-31 01:11:19,587 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.046*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 
0.012*\"simpler\"\n", + "2019-01-31 01:11:19,588 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.020*\"illicit\" + 0.017*\"pain\" + 0.015*\"colder\" + 0.014*\"arsen\" + 0.013*\"black\" + 0.012*\"western\" + 0.012*\"museo\" + 0.011*\"gai\"\n", + "2019-01-31 01:11:19,589 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:11:19,595 : INFO : topic diff=0.003740, rho=0.024977\n", + "2019-01-31 01:11:19,752 : INFO : PROGRESS: pass 0, at document #3208000/4922894\n", + "2019-01-31 01:11:21,151 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:21,417 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"appear\" + 0.007*\"comic\" + 0.007*\"workplac\" + 0.006*\"storag\" + 0.006*\"fusiform\" + 0.006*\"love\"\n", + "2019-01-31 01:11:21,418 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"differ\"\n", + "2019-01-31 01:11:21,419 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.012*\"damag\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:11:21,420 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:21,421 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + 
"2019-01-31 01:11:21,427 : INFO : topic diff=0.003282, rho=0.024969\n", + "2019-01-31 01:11:21,587 : INFO : PROGRESS: pass 0, at document #3210000/4922894\n", + "2019-01-31 01:11:22,983 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:23,253 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"ret\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:11:23,254 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:11:23,256 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"anim\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.006*\"storag\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:11:23,257 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.009*\"cytokin\" + 0.008*\"uruguayan\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 01:11:23,258 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"briarwood\" + 0.011*\"silicon\" + 0.011*\"linear\"\n", + "2019-01-31 01:11:23,264 : INFO : topic diff=0.003698, rho=0.024961\n", + "2019-01-31 01:11:23,421 : INFO : PROGRESS: pass 0, at document #3212000/4922894\n", + "2019-01-31 01:11:24,813 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:25,079 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"rainfal\" + 
0.018*\"nation\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:11:25,080 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.011*\"find\" + 0.011*\"ret\" + 0.011*\"fool\" + 0.010*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:11:25,081 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:11:25,082 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.023*\"poison\" + 0.020*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:11:25,083 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"anim\" + 0.010*\"man\" + 0.010*\"septemb\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.006*\"storag\" + 0.006*\"fusiform\" + 0.006*\"love\"\n", + "2019-01-31 01:11:25,089 : INFO : topic diff=0.003818, rho=0.024953\n", + "2019-01-31 01:11:25,244 : INFO : PROGRESS: pass 0, at document #3214000/4922894\n", + "2019-01-31 01:11:26,622 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:26,888 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 01:11:26,889 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"australia\" + 0.026*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:11:26,890 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.012*\"life\" + 0.012*\"faster\" + 
0.012*\"daughter\" + 0.011*\"john\"\n", + "2019-01-31 01:11:26,891 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:11:26,892 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.010*\"retrospect\" + 0.009*\"fleet\"\n", + "2019-01-31 01:11:26,898 : INFO : topic diff=0.003957, rho=0.024945\n", + "2019-01-31 01:11:27,052 : INFO : PROGRESS: pass 0, at document #3216000/4922894\n", + "2019-01-31 01:11:28,415 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:28,682 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"ret\" + 0.010*\"squatter\" + 0.010*\"champion\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:11:28,683 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.008*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:11:28,684 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.044*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:11:28,685 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.045*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.018*\"leah\" + 0.017*\"kim\" + 0.016*\"sourc\" + 0.013*\"shirin\"\n", + "2019-01-31 01:11:28,686 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 
0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 01:11:28,692 : INFO : topic diff=0.004325, rho=0.024938\n", + "2019-01-31 01:11:28,852 : INFO : PROGRESS: pass 0, at document #3218000/4922894\n", + "2019-01-31 01:11:30,242 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:30,508 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"anglo\" + 0.012*\"islam\" + 0.012*\"televis\" + 0.012*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 01:11:30,509 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.015*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:11:30,510 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:11:30,512 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.033*\"priest\" + 0.022*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.014*\"count\" + 0.013*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 01:11:30,513 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"poll\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:11:30,519 : INFO : topic diff=0.003555, rho=0.024930\n", + "2019-01-31 01:11:33,180 : INFO : -11.619 per-word bound, 3146.2 perplexity estimate based on a held-out corpus of 2000 documents with 544433 words\n", + "2019-01-31 01:11:33,181 : INFO : PROGRESS: pass 0, at document #3220000/4922894\n", + "2019-01-31 01:11:34,554 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:34,821 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:11:34,822 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:11:34,823 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:11:34,824 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:34,825 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"briarwood\" + 0.011*\"depress\" + 0.011*\"linear\"\n", + "2019-01-31 01:11:34,831 : INFO : topic diff=0.003490, rho=0.024922\n", + "2019-01-31 01:11:34,981 : INFO : PROGRESS: pass 0, at document #3222000/4922894\n", + "2019-01-31 01:11:36,312 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:36,579 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.031*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.014*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:11:36,580 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"bank\" + 0.011*\"market\" + 0.011*\"produc\" + 
0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:11:36,581 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.046*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:11:36,582 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:11:36,583 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"squatter\"\n", + "2019-01-31 01:11:36,589 : INFO : topic diff=0.004040, rho=0.024915\n", + "2019-01-31 01:11:36,745 : INFO : PROGRESS: pass 0, at document #3224000/4922894\n", + "2019-01-31 01:11:38,131 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:38,398 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"selma\" + 0.014*\"seaport\" + 0.013*\"bypass\"\n", + "2019-01-31 01:11:38,399 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.013*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.009*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:11:38,400 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.045*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:11:38,401 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 
0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.010*\"lizard\" + 0.010*\"josé\"\n", + "2019-01-31 01:11:38,402 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:11:38,408 : INFO : topic diff=0.003623, rho=0.024907\n", + "2019-01-31 01:11:38,568 : INFO : PROGRESS: pass 0, at document #3226000/4922894\n", + "2019-01-31 01:11:39,944 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:40,211 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:11:40,212 : INFO : topic #44 (0.020): 0.035*\"rooftop\" + 0.029*\"final\" + 0.021*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.013*\"tiepolo\" + 0.012*\"winner\"\n", + "2019-01-31 01:11:40,213 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.015*\"damag\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:11:40,214 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"spectacl\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:11:40,215 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.015*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 01:11:40,221 : INFO : topic diff=0.003542, rho=0.024899\n", + "2019-01-31 01:11:40,379 : INFO : PROGRESS: pass 0, at document #3228000/4922894\n", + 
"2019-01-31 01:11:41,776 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:42,043 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.036*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"serv\" + 0.020*\"traceabl\" + 0.014*\"oper\" + 0.013*\"airmen\" + 0.013*\"rivièr\" + 0.010*\"transient\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:11:42,044 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"retrospect\" + 0.009*\"fleet\"\n", + "2019-01-31 01:11:42,045 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"spectacl\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:11:42,046 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.016*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.010*\"worldwid\" + 0.010*\"magazin\"\n", + "2019-01-31 01:11:42,047 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.045*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:11:42,053 : INFO : topic diff=0.003788, rho=0.024891\n", + "2019-01-31 01:11:42,204 : INFO : PROGRESS: pass 0, at document #3230000/4922894\n", + "2019-01-31 01:11:43,551 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:43,818 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"spectacl\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:11:43,819 : INFO : topic #26 (0.020): 
0.032*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"nation\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:11:43,820 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.024*\"poison\" + 0.019*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:11:43,821 : INFO : topic #40 (0.020): 0.089*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.016*\"professor\" + 0.011*\"word\" + 0.011*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:11:43,822 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.013*\"anglo\" + 0.012*\"muskoge\" + 0.011*\"televis\" + 0.010*\"sri\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:11:43,828 : INFO : topic diff=0.004149, rho=0.024884\n", + "2019-01-31 01:11:44,040 : INFO : PROGRESS: pass 0, at document #3232000/4922894\n", + "2019-01-31 01:11:45,410 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:45,677 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:11:45,678 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"personifi\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.019*\"moscow\" + 0.016*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:11:45,679 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.034*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.014*\"count\" + 0.013*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 
01:11:45,680 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.014*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:11:45,681 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:11:45,687 : INFO : topic diff=0.003635, rho=0.024876\n", + "2019-01-31 01:11:45,847 : INFO : PROGRESS: pass 0, at document #3234000/4922894\n", + "2019-01-31 01:11:47,254 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:47,521 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.009*\"western\" + 0.009*\"median\" + 0.008*\"trap\" + 0.008*\"feel\" + 0.008*\"male\"\n", + "2019-01-31 01:11:47,522 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.034*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.014*\"count\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:11:47,523 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.008*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:11:47,524 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"serv\" + 0.020*\"traceabl\" + 0.014*\"oper\" + 0.013*\"airmen\" + 0.012*\"rivièr\" + 0.011*\"transient\"\n", + "2019-01-31 01:11:47,525 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:11:47,531 : 
INFO : topic diff=0.004368, rho=0.024868\n", + "2019-01-31 01:11:47,684 : INFO : PROGRESS: pass 0, at document #3236000/4922894\n", + "2019-01-31 01:11:49,061 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:49,327 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:11:49,328 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:11:49,329 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:11:49,330 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:11:49,331 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"champion\" + 0.010*\"landslid\"\n", + "2019-01-31 01:11:49,337 : INFO : topic diff=0.003402, rho=0.024861\n", + "2019-01-31 01:11:49,496 : INFO : PROGRESS: pass 0, at document #3238000/4922894\n", + "2019-01-31 01:11:50,886 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:51,153 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", 
+ "2019-01-31 01:11:51,155 : INFO : topic #25 (0.020): 0.035*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"vacant\" + 0.009*\"sourc\" + 0.008*\"palmer\"\n", + "2019-01-31 01:11:51,155 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:11:51,156 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:11:51,158 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.020*\"illicit\" + 0.018*\"pain\" + 0.016*\"colder\" + 0.015*\"arsen\" + 0.013*\"black\" + 0.012*\"museo\" + 0.012*\"western\" + 0.011*\"gai\"\n", + "2019-01-31 01:11:51,163 : INFO : topic diff=0.003652, rho=0.024853\n", + "2019-01-31 01:11:53,860 : INFO : -11.507 per-word bound, 2910.5 perplexity estimate based on a held-out corpus of 2000 documents with 563587 words\n", + "2019-01-31 01:11:53,860 : INFO : PROGRESS: pass 0, at document #3240000/4922894\n", + "2019-01-31 01:11:55,230 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:55,496 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:11:55,497 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.008*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:11:55,498 : INFO : 
topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.020*\"illicit\" + 0.018*\"pain\" + 0.015*\"colder\" + 0.015*\"arsen\" + 0.013*\"black\" + 0.013*\"western\" + 0.012*\"museo\" + 0.011*\"gai\"\n", + "2019-01-31 01:11:55,499 : INFO : topic #20 (0.020): 0.148*\"scholar\" + 0.041*\"struggl\" + 0.036*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:11:55,500 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:11:55,506 : INFO : topic diff=0.003893, rho=0.024845\n", + "2019-01-31 01:11:55,660 : INFO : PROGRESS: pass 0, at document #3242000/4922894\n", + "2019-01-31 01:11:57,024 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:57,291 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:11:57,292 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:11:57,293 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"nation\" + 0.018*\"atheist\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:11:57,294 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:11:57,295 : INFO : topic #37 (0.020): 
0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"love\"\n", + "2019-01-31 01:11:57,301 : INFO : topic diff=0.003654, rho=0.024838\n", + "2019-01-31 01:11:57,458 : INFO : PROGRESS: pass 0, at document #3244000/4922894\n", + "2019-01-31 01:11:58,832 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:11:59,098 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.017*\"start\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:11:59,099 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:11:59,100 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"militari\" + 0.006*\"till\"\n", + "2019-01-31 01:11:59,101 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.030*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:11:59,102 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:11:59,108 : INFO : topic diff=0.003935, rho=0.024830\n", + "2019-01-31 01:11:59,265 : INFO : PROGRESS: pass 0, at document #3246000/4922894\n", + "2019-01-31 01:12:00,643 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:00,909 : INFO : 
topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"multitud\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:12:00,910 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:12:00,911 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.043*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.016*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 01:12:00,912 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.027*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:12:00,913 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.015*\"swedish\" + 0.015*\"damag\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.012*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:12:00,919 : INFO : topic diff=0.004061, rho=0.024822\n", + "2019-01-31 01:12:01,072 : INFO : PROGRESS: pass 0, at document #3248000/4922894\n", + "2019-01-31 01:12:02,437 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:02,704 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.033*\"priest\" + 0.022*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.018*\"grammat\" + 0.017*\"idiosyncrat\" + 0.014*\"count\" + 0.013*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 01:12:02,705 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:12:02,707 : INFO : 
topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:12:02,708 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 01:12:02,709 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.044*\"line\" + 0.035*\"raid\" + 0.027*\"rosenwald\" + 0.020*\"serv\" + 0.020*\"traceabl\" + 0.014*\"oper\" + 0.013*\"rivièr\" + 0.013*\"airmen\" + 0.011*\"transient\"\n", + "2019-01-31 01:12:02,715 : INFO : topic diff=0.003199, rho=0.024815\n", + "2019-01-31 01:12:02,868 : INFO : PROGRESS: pass 0, at document #3250000/4922894\n", + "2019-01-31 01:12:04,230 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:04,497 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:12:04,498 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.016*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"magazin\" + 0.011*\"storag\"\n", + "2019-01-31 01:12:04,499 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.010*\"champion\" + 0.009*\"théori\"\n", + "2019-01-31 01:12:04,500 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.075*\"octob\" + 0.070*\"august\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.069*\"juli\" + 0.068*\"april\" + 0.066*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:12:04,501 : INFO : topic 
#2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.013*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.009*\"vernon\"\n", + "2019-01-31 01:12:04,507 : INFO : topic diff=0.003644, rho=0.024807\n", + "2019-01-31 01:12:04,664 : INFO : PROGRESS: pass 0, at document #3252000/4922894\n", + "2019-01-31 01:12:06,062 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:06,328 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.015*\"retroflex\" + 0.015*\"sail\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"centuri\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:12:06,330 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.017*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"winner\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:12:06,331 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"linear\" + 0.011*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:12:06,332 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:12:06,333 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:12:06,339 : INFO : topic diff=0.003321, rho=0.024799\n", + "2019-01-31 01:12:06,491 : INFO : PROGRESS: pass 0, at document #3254000/4922894\n", + "2019-01-31 01:12:07,851 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:08,117 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:12:08,118 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.011*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:12:08,119 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.011*\"cdr\"\n", + "2019-01-31 01:12:08,120 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:12:08,121 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.075*\"octob\" + 0.070*\"august\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.069*\"juli\" + 0.069*\"april\" + 0.067*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:12:08,127 : INFO : topic diff=0.003959, rho=0.024792\n", + "2019-01-31 01:12:08,279 : INFO : PROGRESS: pass 0, at document #3256000/4922894\n", + "2019-01-31 01:12:09,640 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:09,906 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"pop\" + 0.010*\"network\" + 0.009*\"cytokin\" + 0.008*\"uruguayan\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"championship\" + 0.007*\"diggin\"\n", + "2019-01-31 01:12:09,907 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"christian\" + 0.021*\"cathol\" + 0.020*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 
0.010*\"poll\" + 0.009*\"historiographi\" + 0.009*\"centuri\"\n", + "2019-01-31 01:12:09,908 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:12:09,909 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.069*\"best\" + 0.035*\"yawn\" + 0.027*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"festiv\" + 0.021*\"noll\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:12:09,910 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.029*\"woman\" + 0.029*\"champion\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"nation\" + 0.017*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:12:09,916 : INFO : topic diff=0.003543, rho=0.024784\n", + "2019-01-31 01:12:10,073 : INFO : PROGRESS: pass 0, at document #3258000/4922894\n", + "2019-01-31 01:12:11,475 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:11,742 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"proper\" + 0.006*\"have\" + 0.006*\"caus\" + 0.006*\"effect\" + 0.006*\"acid\"\n", + "2019-01-31 01:12:11,744 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:12:11,745 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"winner\"\n", + "2019-01-31 01:12:11,746 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"ret\" + 0.011*\"fool\" + 
0.011*\"find\" + 0.010*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:12:11,747 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:12:11,753 : INFO : topic diff=0.003865, rho=0.024776\n", + "2019-01-31 01:12:14,417 : INFO : -12.063 per-word bound, 4279.8 perplexity estimate based on a held-out corpus of 2000 documents with 542664 words\n", + "2019-01-31 01:12:14,418 : INFO : PROGRESS: pass 0, at document #3260000/4922894\n", + "2019-01-31 01:12:15,786 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:16,052 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"linear\" + 0.011*\"briarwood\" + 0.011*\"depress\"\n", + "2019-01-31 01:12:16,054 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.027*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:12:16,055 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:12:16,056 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:12:16,056 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:12:16,062 
: INFO : topic diff=0.003384, rho=0.024769\n", + "2019-01-31 01:12:16,274 : INFO : PROGRESS: pass 0, at document #3262000/4922894\n", + "2019-01-31 01:12:17,646 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:17,913 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:12:17,914 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"pope\" + 0.013*\"scot\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.010*\"fleet\" + 0.009*\"vernon\"\n", + "2019-01-31 01:12:17,915 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.017*\"polit\" + 0.017*\"dutch\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:12:17,916 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:12:17,917 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.030*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:12:17,923 : INFO : topic diff=0.003440, rho=0.024761\n", + "2019-01-31 01:12:18,081 : INFO : PROGRESS: pass 0, at document #3264000/4922894\n", + "2019-01-31 01:12:19,490 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:19,757 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"liber\" + 0.014*\"seaport\" + 0.013*\"selma\" + 0.013*\"republ\"\n", + "2019-01-31 
01:12:19,758 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"winner\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:12:19,759 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:12:19,760 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.009*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:12:19,761 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"pop\" + 0.010*\"network\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"championship\" + 0.007*\"diggin\"\n", + "2019-01-31 01:12:19,767 : INFO : topic diff=0.004756, rho=0.024754\n", + "2019-01-31 01:12:19,923 : INFO : PROGRESS: pass 0, at document #3266000/4922894\n", + "2019-01-31 01:12:21,279 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:21,545 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:12:21,546 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:12:21,547 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.042*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 
0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:12:21,548 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:12:21,549 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.049*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"cdr\"\n", + "2019-01-31 01:12:21,555 : INFO : topic diff=0.003919, rho=0.024746\n", + "2019-01-31 01:12:21,710 : INFO : PROGRESS: pass 0, at document #3268000/4922894\n", + "2019-01-31 01:12:23,076 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:23,343 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:12:23,344 : INFO : topic #19 (0.020): 0.018*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:12:23,345 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:12:23,346 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.020*\"folei\" + 0.019*\"player\" + 0.017*\"polit\" + 0.017*\"dutch\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:12:23,347 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.012*\"militari\" + 
0.011*\"diversifi\"\n", + "2019-01-31 01:12:23,353 : INFO : topic diff=0.003619, rho=0.024739\n", + "2019-01-31 01:12:23,516 : INFO : PROGRESS: pass 0, at document #3270000/4922894\n", + "2019-01-31 01:12:24,901 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:25,168 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"liber\" + 0.014*\"seaport\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:12:25,169 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.019*\"lagrang\" + 0.019*\"area\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:12:25,170 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.009*\"sri\" + 0.009*\"alam\"\n", + "2019-01-31 01:12:25,171 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:12:25,172 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.017*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:12:25,177 : INFO : topic diff=0.004240, rho=0.024731\n", + "2019-01-31 01:12:25,333 : INFO : PROGRESS: pass 0, at document #3272000/4922894\n", + "2019-01-31 01:12:26,724 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:26,991 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 
0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:12:26,992 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.049*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"cdr\"\n", + "2019-01-31 01:12:26,993 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:12:26,995 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.017*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:12:26,996 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.022*\"septemb\" + 0.019*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:12:27,002 : INFO : topic diff=0.003828, rho=0.024723\n", + "2019-01-31 01:12:27,158 : INFO : PROGRESS: pass 0, at document #3274000/4922894\n", + "2019-01-31 01:12:28,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:28,800 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:12:28,801 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.019*\"lagrang\" + 0.019*\"area\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:12:28,802 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.019*\"illicit\" + 0.018*\"pain\" + 0.016*\"arsen\" + 0.015*\"colder\" + 0.014*\"museo\" + 0.013*\"black\" + 0.012*\"western\" + 
0.011*\"gai\"\n", + "2019-01-31 01:12:28,803 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:12:28,804 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"clean\" + 0.007*\"championship\"\n", + "2019-01-31 01:12:28,810 : INFO : topic diff=0.003878, rho=0.024716\n", + "2019-01-31 01:12:28,966 : INFO : PROGRESS: pass 0, at document #3276000/4922894\n", + "2019-01-31 01:12:30,364 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:30,630 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.011*\"briarwood\" + 0.011*\"depress\"\n", + "2019-01-31 01:12:30,631 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"nation\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:12:30,632 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:12:30,633 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.044*\"chilton\" + 0.026*\"kong\" + 0.023*\"hong\" + 0.020*\"korea\" + 0.018*\"leah\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.015*\"kim\"\n", + "2019-01-31 01:12:30,634 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.076*\"octob\" + 0.072*\"august\" + 0.070*\"notion\" + 0.070*\"juli\" 
+ 0.069*\"januari\" + 0.069*\"april\" + 0.067*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:12:30,640 : INFO : topic diff=0.003458, rho=0.024708\n", + "2019-01-31 01:12:30,799 : INFO : PROGRESS: pass 0, at document #3278000/4922894\n", + "2019-01-31 01:12:32,186 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:32,452 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.019*\"lagrang\" + 0.019*\"area\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:12:32,453 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.026*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"nation\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:12:32,454 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:12:32,455 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:12:32,456 : INFO : topic #44 (0.020): 0.035*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.017*\"champion\" + 0.016*\"tiepolo\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 01:12:32,462 : INFO : topic diff=0.004167, rho=0.024701\n", + "2019-01-31 01:12:35,202 : INFO : -11.753 per-word bound, 3451.2 perplexity estimate based on a held-out corpus of 2000 documents with 561527 words\n", + "2019-01-31 01:12:35,203 : INFO : PROGRESS: pass 0, at document #3280000/4922894\n", + "2019-01-31 01:12:36,597 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 01:12:36,863 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:12:36,864 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.076*\"octob\" + 0.073*\"august\" + 0.070*\"notion\" + 0.069*\"juli\" + 0.068*\"april\" + 0.068*\"januari\" + 0.067*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:12:36,865 : INFO : topic #10 (0.020): 0.014*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"proper\" + 0.007*\"have\" + 0.006*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:12:36,866 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"serv\" + 0.020*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.013*\"rivièr\" + 0.011*\"transient\"\n", + "2019-01-31 01:12:36,867 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"illicit\" + 0.018*\"pain\" + 0.017*\"arsen\" + 0.015*\"colder\" + 0.015*\"museo\" + 0.013*\"black\" + 0.012*\"western\" + 0.011*\"gai\"\n", + "2019-01-31 01:12:36,873 : INFO : topic diff=0.003950, rho=0.024693\n", + "2019-01-31 01:12:37,031 : INFO : PROGRESS: pass 0, at document #3282000/4922894\n", + "2019-01-31 01:12:38,415 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:38,682 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.020*\"lagrang\" + 0.019*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:12:38,683 : INFO : topic #20 (0.020): 0.148*\"scholar\" + 0.040*\"struggl\" + 0.035*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + 
"2019-01-31 01:12:38,684 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:12:38,685 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 01:12:38,686 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:12:38,692 : INFO : topic diff=0.003749, rho=0.024686\n", + "2019-01-31 01:12:38,850 : INFO : PROGRESS: pass 0, at document #3284000/4922894\n", + "2019-01-31 01:12:40,238 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:40,505 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:12:40,506 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:12:40,507 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"spectacl\" + 0.007*\"candid\" + 0.006*\"develop\"\n", + "2019-01-31 01:12:40,508 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 
0.009*\"highli\"\n", + "2019-01-31 01:12:40,509 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:12:40,515 : INFO : topic diff=0.003935, rho=0.024678\n", + "2019-01-31 01:12:40,672 : INFO : PROGRESS: pass 0, at document #3286000/4922894\n", + "2019-01-31 01:12:42,045 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:42,311 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"summerhil\" + 0.007*\"woman\"\n", + "2019-01-31 01:12:42,312 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:12:42,313 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.020*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"lobe\"\n", + "2019-01-31 01:12:42,314 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"poll\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:12:42,315 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:12:42,321 : INFO : topic diff=0.004167, rho=0.024671\n", + "2019-01-31 01:12:42,476 : INFO : PROGRESS: pass 0, at document #3288000/4922894\n", + "2019-01-31 01:12:43,856 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:44,122 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:12:44,123 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:12:44,125 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.044*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.013*\"rivièr\" + 0.011*\"transient\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:12:44,125 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.025*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:12:44,127 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.020*\"lagrang\" + 0.018*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:12:44,132 : INFO : topic diff=0.003747, rho=0.024663\n", + "2019-01-31 01:12:44,289 : INFO : PROGRESS: pass 0, at document #3290000/4922894\n", + "2019-01-31 01:12:45,670 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:45,936 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.011*\"wreath\"\n", + "2019-01-31 01:12:45,938 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 
0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 01:12:45,939 : INFO : topic #26 (0.020): 0.033*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"nation\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:12:45,940 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.009*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:12:45,941 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"linear\" + 0.011*\"depress\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:12:45,947 : INFO : topic diff=0.003592, rho=0.024656\n", + "2019-01-31 01:12:46,104 : INFO : PROGRESS: pass 0, at document #3292000/4922894\n", + "2019-01-31 01:12:47,482 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:47,748 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.013*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"mexican\" + 0.011*\"lizard\"\n", + "2019-01-31 01:12:47,750 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:12:47,751 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"berlin\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:12:47,752 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 
0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"order\" + 0.008*\"legal\"\n", + "2019-01-31 01:12:47,753 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"spectacl\" + 0.007*\"candid\" + 0.006*\"produc\"\n", + "2019-01-31 01:12:47,759 : INFO : topic diff=0.003695, rho=0.024648\n", + "2019-01-31 01:12:47,978 : INFO : PROGRESS: pass 0, at document #3294000/4922894\n", + "2019-01-31 01:12:49,390 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:49,657 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.008*\"feel\" + 0.007*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 01:12:49,658 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.041*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:12:49,659 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"jewish\" + 0.016*\"vol\" + 0.015*\"berlin\" + 0.015*\"israel\" + 0.013*\"der\" + 0.011*\"jeremiah\" + 0.010*\"european\" + 0.009*\"europ\"\n", + "2019-01-31 01:12:49,660 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.021*\"collector\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 01:12:49,661 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:12:49,667 : INFO : topic diff=0.004864, rho=0.024641\n", + "2019-01-31 01:12:49,824 : INFO : 
PROGRESS: pass 0, at document #3296000/4922894\n", + "2019-01-31 01:12:51,220 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:51,487 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.031*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:12:51,488 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.016*\"rivièr\" + 0.014*\"histor\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"linear\" + 0.011*\"depress\" + 0.011*\"briarwood\"\n", + "2019-01-31 01:12:51,489 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"militari\" + 0.006*\"till\"\n", + "2019-01-31 01:12:51,490 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.015*\"sail\" + 0.015*\"retroflex\" + 0.010*\"poll\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"centuri\"\n", + "2019-01-31 01:12:51,491 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.021*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:12:51,497 : INFO : topic diff=0.003464, rho=0.024633\n", + "2019-01-31 01:12:51,653 : INFO : PROGRESS: pass 0, at document #3298000/4922894\n", + "2019-01-31 01:12:53,029 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:53,295 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.027*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:12:53,296 : INFO : topic #4 (0.020): 
0.022*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"spectacl\" + 0.006*\"candid\" + 0.006*\"produc\"\n", + "2019-01-31 01:12:53,297 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:12:53,299 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:12:53,300 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"vernon\"\n", + "2019-01-31 01:12:53,305 : INFO : topic diff=0.003670, rho=0.024626\n", + "2019-01-31 01:12:56,018 : INFO : -11.834 per-word bound, 3650.7 perplexity estimate based on a held-out corpus of 2000 documents with 546499 words\n", + "2019-01-31 01:12:56,018 : INFO : PROGRESS: pass 0, at document #3300000/4922894\n", + "2019-01-31 01:12:57,407 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:57,673 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.022*\"area\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:12:57,675 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:12:57,676 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.016*\"retroflex\" + 
0.015*\"sail\" + 0.010*\"poll\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:12:57,677 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:12:57,678 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.044*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.013*\"rivièr\" + 0.011*\"transient\"\n", + "2019-01-31 01:12:57,684 : INFO : topic diff=0.003650, rho=0.024618\n", + "2019-01-31 01:12:57,841 : INFO : PROGRESS: pass 0, at document #3302000/4922894\n", + "2019-01-31 01:12:59,227 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:12:59,493 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.020*\"quarterli\" + 0.019*\"rotterdam\" + 0.017*\"grammat\" + 0.016*\"idiosyncrat\" + 0.014*\"count\" + 0.013*\"order\" + 0.013*\"portugues\"\n", + "2019-01-31 01:12:59,494 : INFO : topic #22 (0.020): 0.037*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.008*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" + 0.007*\"male\" + 0.007*\"trap\"\n", + "2019-01-31 01:12:59,495 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.009*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:12:59,496 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:12:59,497 : INFO : topic #12 (0.020): 0.009*\"number\" + 
0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\"\n", + "2019-01-31 01:12:59,503 : INFO : topic diff=0.003686, rho=0.024611\n", + "2019-01-31 01:12:59,659 : INFO : PROGRESS: pass 0, at document #3304000/4922894\n", + "2019-01-31 01:13:01,034 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:01,301 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:13:01,302 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:13:01,303 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:13:01,304 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.029*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"nation\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:13:01,305 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.007*\"candid\" + 0.006*\"spectacl\" + 0.006*\"produc\"\n", + "2019-01-31 01:13:01,311 : INFO : topic diff=0.003653, rho=0.024603\n", + "2019-01-31 01:13:01,470 : INFO : PROGRESS: pass 0, at document #3306000/4922894\n", + "2019-01-31 01:13:02,839 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:03,109 : INFO : topic #21 
(0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.010*\"mexican\"\n", + "2019-01-31 01:13:03,110 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:13:03,111 : INFO : topic #44 (0.020): 0.034*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.017*\"champion\" + 0.016*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 01:13:03,112 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 01:13:03,113 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.011*\"wreath\"\n", + "2019-01-31 01:13:03,119 : INFO : topic diff=0.003322, rho=0.024596\n", + "2019-01-31 01:13:03,276 : INFO : PROGRESS: pass 0, at document #3308000/4922894\n", + "2019-01-31 01:13:04,659 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:04,925 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:13:04,926 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:13:04,927 : INFO : topic #34 (0.020): 0.069*\"start\" + 
0.034*\"new\" + 0.032*\"american\" + 0.031*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:13:04,929 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"proper\" + 0.006*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:13:04,930 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:13:04,936 : INFO : topic diff=0.003355, rho=0.024589\n", + "2019-01-31 01:13:05,091 : INFO : PROGRESS: pass 0, at document #3310000/4922894\n", + "2019-01-31 01:13:06,463 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:06,730 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.028*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"nation\" + 0.018*\"rainfal\" + 0.018*\"atheist\"\n", + "2019-01-31 01:13:06,731 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.048*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:13:06,732 : INFO : topic #36 (0.020): 0.010*\"prognosi\" + 0.010*\"pop\" + 0.010*\"network\" + 0.009*\"cytokin\" + 0.008*\"user\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"championship\"\n", + "2019-01-31 01:13:06,733 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wreath\"\n", + "2019-01-31 01:13:06,734 : INFO : topic #8 (0.020): 0.026*\"law\" + 
0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:13:06,740 : INFO : topic diff=0.003703, rho=0.024581\n", + "2019-01-31 01:13:06,895 : INFO : PROGRESS: pass 0, at document #3312000/4922894\n", + "2019-01-31 01:13:08,263 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:08,530 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:13:08,531 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:13:08,532 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:13:08,533 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:13:08,534 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.013*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 01:13:08,540 : INFO : topic diff=0.004365, rho=0.024574\n", + "2019-01-31 01:13:08,693 : INFO : PROGRESS: pass 0, at document #3314000/4922894\n", + "2019-01-31 01:13:10,049 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:13:10,316 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.047*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:13:10,317 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.021*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.013*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:13:10,318 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:13:10,319 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.018*\"arsen\" + 0.016*\"museo\" + 0.015*\"colder\" + 0.013*\"black\" + 0.012*\"western\" + 0.012*\"gai\"\n", + "2019-01-31 01:13:10,320 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:13:10,326 : INFO : topic diff=0.004409, rho=0.024566\n", + "2019-01-31 01:13:10,477 : INFO : PROGRESS: pass 0, at document #3316000/4922894\n", + "2019-01-31 01:13:11,821 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:12,090 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.011*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:13:12,092 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.014*\"rivièr\" + 
0.011*\"transient\"\n", + "2019-01-31 01:13:12,093 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:13:12,094 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.016*\"swedish\" + 0.015*\"norwegian\" + 0.014*\"damag\" + 0.013*\"wind\" + 0.012*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"turkish\"\n", + "2019-01-31 01:13:12,095 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:13:12,101 : INFO : topic diff=0.004118, rho=0.024559\n", + "2019-01-31 01:13:12,256 : INFO : PROGRESS: pass 0, at document #3318000/4922894\n", + "2019-01-31 01:13:13,635 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:13,901 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.010*\"fool\" + 0.010*\"champion\" + 0.009*\"landslid\"\n", + "2019-01-31 01:13:13,902 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.015*\"arsen\" + 0.013*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.010*\"nicola\"\n", + "2019-01-31 01:13:13,904 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.017*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.008*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:13:13,905 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 
0.006*\"ancestor\"\n", + "2019-01-31 01:13:13,906 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:13:13,912 : INFO : topic diff=0.002821, rho=0.024551\n", + "2019-01-31 01:13:16,578 : INFO : -11.544 per-word bound, 2985.7 perplexity estimate based on a held-out corpus of 2000 documents with 544621 words\n", + "2019-01-31 01:13:16,578 : INFO : PROGRESS: pass 0, at document #3320000/4922894\n", + "2019-01-31 01:13:17,944 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:18,213 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:13:18,214 : INFO : topic #23 (0.020): 0.132*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:13:18,215 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"militari\" + 0.006*\"govern\" + 0.006*\"till\"\n", + "2019-01-31 01:13:18,216 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:13:18,217 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"idiosyncrat\" + 0.014*\"count\" + 0.014*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:13:18,223 : INFO : topic diff=0.003584, rho=0.024544\n", + 
"2019-01-31 01:13:18,387 : INFO : PROGRESS: pass 0, at document #3322000/4922894\n", + "2019-01-31 01:13:19,808 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:20,075 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"candid\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:13:20,076 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.047*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"player\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:13:20,077 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:13:20,078 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.014*\"rivièr\" + 0.011*\"transient\"\n", + "2019-01-31 01:13:20,079 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:13:20,085 : INFO : topic diff=0.004407, rho=0.024537\n", + "2019-01-31 01:13:20,246 : INFO : PROGRESS: pass 0, at document #3324000/4922894\n", + "2019-01-31 01:13:21,651 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:21,918 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.015*\"rivièr\" + 0.014*\"histor\" + 0.012*\"constitut\" + 0.011*\"silicon\" + 0.011*\"linear\" + 0.011*\"briarwood\" + 0.011*\"depress\"\n", + "2019-01-31 01:13:21,919 : INFO : topic #42 (0.020): 
0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"jeremiah\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:13:21,920 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:13:21,921 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.014*\"rivièr\" + 0.011*\"transient\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:13:21,922 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.026*\"fifteenth\" + 0.019*\"illicit\" + 0.019*\"pain\" + 0.019*\"arsen\" + 0.016*\"museo\" + 0.014*\"colder\" + 0.013*\"black\" + 0.013*\"western\" + 0.012*\"gai\"\n", + "2019-01-31 01:13:21,928 : INFO : topic diff=0.003536, rho=0.024529\n", + "2019-01-31 01:13:22,084 : INFO : PROGRESS: pass 0, at document #3326000/4922894\n", + "2019-01-31 01:13:23,461 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:23,728 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.014*\"damag\" + 0.013*\"wind\" + 0.013*\"huntsvil\" + 0.012*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:13:23,729 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:13:23,731 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 
0.006*\"till\"\n", + "2019-01-31 01:13:23,732 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"jeremiah\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:13:23,733 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 01:13:23,739 : INFO : topic diff=0.003432, rho=0.024522\n", + "2019-01-31 01:13:23,956 : INFO : PROGRESS: pass 0, at document #3328000/4922894\n", + "2019-01-31 01:13:25,351 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:25,617 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:13:25,618 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.079*\"sens\" + 0.076*\"octob\" + 0.075*\"august\" + 0.074*\"juli\" + 0.070*\"april\" + 0.069*\"judici\" + 0.069*\"januari\" + 0.069*\"notion\" + 0.065*\"decatur\"\n", + "2019-01-31 01:13:25,619 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:13:25,620 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"reprint\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:13:25,621 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"woman\" + 0.028*\"champion\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"rainfal\" + 
0.018*\"taxpay\" + 0.018*\"nation\"\n", + "2019-01-31 01:13:25,627 : INFO : topic diff=0.003442, rho=0.024515\n", + "2019-01-31 01:13:25,784 : INFO : PROGRESS: pass 0, at document #3330000/4922894\n", + "2019-01-31 01:13:27,157 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:27,424 : INFO : topic #23 (0.020): 0.133*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:13:27,425 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:13:27,426 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.015*\"arsen\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.010*\"author\"\n", + "2019-01-31 01:13:27,427 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.076*\"octob\" + 0.075*\"august\" + 0.073*\"juli\" + 0.070*\"april\" + 0.069*\"januari\" + 0.069*\"notion\" + 0.068*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:13:27,428 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" + 0.007*\"trap\" + 0.007*\"male\"\n", + "2019-01-31 01:13:27,434 : INFO : topic diff=0.003903, rho=0.024507\n", + "2019-01-31 01:13:27,595 : INFO : PROGRESS: pass 0, at document #3332000/4922894\n", + "2019-01-31 01:13:29,000 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:29,266 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.010*\"jeremiah\" + 
0.010*\"european\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:13:29,267 : INFO : topic #4 (0.020): 0.022*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:13:29,268 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:13:29,269 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" + 0.007*\"trap\" + 0.007*\"male\"\n", + "2019-01-31 01:13:29,270 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.019*\"arsen\" + 0.016*\"museo\" + 0.015*\"colder\" + 0.013*\"black\" + 0.013*\"western\" + 0.012*\"gai\"\n", + "2019-01-31 01:13:29,276 : INFO : topic diff=0.003799, rho=0.024500\n", + "2019-01-31 01:13:29,433 : INFO : PROGRESS: pass 0, at document #3334000/4922894\n", + "2019-01-31 01:13:30,826 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:31,092 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.010*\"sri\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.010*\"affection\"\n", + "2019-01-31 01:13:31,093 : INFO : topic #46 (0.020): 0.017*\"norwai\" + 0.017*\"stop\" + 0.016*\"sweden\" + 0.015*\"norwegian\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"wind\" + 0.012*\"huntsvil\" + 0.012*\"treeless\" + 0.011*\"turkish\"\n", + "2019-01-31 01:13:31,094 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" 
+ 0.007*\"trap\" + 0.007*\"incom\"\n", + "2019-01-31 01:13:31,095 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:13:31,096 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.016*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:13:31,102 : INFO : topic diff=0.003805, rho=0.024492\n", + "2019-01-31 01:13:31,260 : INFO : PROGRESS: pass 0, at document #3336000/4922894\n", + "2019-01-31 01:13:32,658 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:32,924 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:13:32,925 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.023*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.011*\"carlo\" + 0.010*\"juan\"\n", + "2019-01-31 01:13:32,926 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"jewish\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.015*\"berlin\" + 0.014*\"der\" + 0.010*\"jeremiah\" + 0.010*\"european\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:13:32,927 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.027*\"hous\" + 0.018*\"buford\" + 0.015*\"rivièr\" + 0.014*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:13:32,928 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 
0.008*\"softwar\" + 0.007*\"championship\" + 0.007*\"includ\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:13:32,934 : INFO : topic diff=0.003221, rho=0.024485\n", + "2019-01-31 01:13:33,089 : INFO : PROGRESS: pass 0, at document #3338000/4922894\n", + "2019-01-31 01:13:34,457 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:34,723 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:13:34,725 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:13:34,726 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.009*\"septemb\"\n", + "2019-01-31 01:13:34,727 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"israel\" + 0.015*\"berlin\" + 0.014*\"der\" + 0.010*\"jeremiah\" + 0.010*\"european\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:13:34,728 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:13:34,734 : INFO : topic diff=0.003667, rho=0.024478\n", + "2019-01-31 01:13:37,448 : INFO : -11.542 per-word bound, 2982.3 perplexity estimate based on a held-out corpus of 2000 documents with 548041 words\n", + "2019-01-31 01:13:37,448 : INFO : PROGRESS: pass 0, at document #3340000/4922894\n", + "2019-01-31 01:13:38,842 : 
INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:39,109 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:13:39,110 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 01:13:39,111 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.014*\"rivièr\" + 0.011*\"transient\"\n", + "2019-01-31 01:13:39,112 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.007*\"includ\" + 0.007*\"championship\"\n", + "2019-01-31 01:13:39,113 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.009*\"septemb\"\n", + "2019-01-31 01:13:39,119 : INFO : topic diff=0.003463, rho=0.024470\n", + "2019-01-31 01:13:39,280 : INFO : PROGRESS: pass 0, at document #3342000/4922894\n", + "2019-01-31 01:13:40,692 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:40,958 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.025*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:13:40,959 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.017*\"com\" + 0.015*\"oper\" + 
0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:13:40,961 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 01:13:40,962 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:13:40,963 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.013*\"czech\"\n", + "2019-01-31 01:13:40,968 : INFO : topic diff=0.003179, rho=0.024463\n", + "2019-01-31 01:13:41,124 : INFO : PROGRESS: pass 0, at document #3344000/4922894\n", + "2019-01-31 01:13:42,503 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:42,769 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:13:42,771 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 01:13:42,772 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.075*\"august\" + 0.074*\"juli\" + 0.071*\"januari\" + 0.071*\"april\" + 0.071*\"notion\" + 0.069*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:13:42,773 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 
0.016*\"new\" + 0.015*\"hydrogen\" + 0.014*\"quebec\" + 0.014*\"novotná\" + 0.014*\"misericordia\"\n", + "2019-01-31 01:13:42,774 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.011*\"wreath\"\n", + "2019-01-31 01:13:42,779 : INFO : topic diff=0.003150, rho=0.024456\n", + "2019-01-31 01:13:42,943 : INFO : PROGRESS: pass 0, at document #3346000/4922894\n", + "2019-01-31 01:13:44,350 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:44,617 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:13:44,618 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:13:44,619 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:13:44,620 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:13:44,621 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:13:44,627 : INFO : topic diff=0.004405, rho=0.024448\n", + "2019-01-31 01:13:44,784 : INFO : PROGRESS: pass 0, at document #3348000/4922894\n", + "2019-01-31 01:13:46,159 
: INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:46,426 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"serv\" + 0.020*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.014*\"rivièr\" + 0.011*\"transient\"\n", + "2019-01-31 01:13:46,427 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.020*\"member\" + 0.017*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:13:46,428 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 01:13:46,429 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.021*\"arsen\" + 0.020*\"pain\" + 0.019*\"illicit\" + 0.017*\"museo\" + 0.014*\"colder\" + 0.013*\"black\" + 0.013*\"gai\" + 0.013*\"western\"\n", + "2019-01-31 01:13:46,430 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"love\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:13:46,436 : INFO : topic diff=0.003254, rho=0.024441\n", + "2019-01-31 01:13:46,594 : INFO : PROGRESS: pass 0, at document #3350000/4922894\n", + "2019-01-31 01:13:47,977 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:48,244 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" + 0.007*\"trap\" + 0.007*\"incom\"\n", + "2019-01-31 01:13:48,245 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 
0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:13:48,246 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.025*\"fifteenth\" + 0.021*\"arsen\" + 0.020*\"pain\" + 0.019*\"illicit\" + 0.017*\"museo\" + 0.014*\"colder\" + 0.013*\"black\" + 0.013*\"western\" + 0.013*\"gai\"\n", + "2019-01-31 01:13:48,247 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.076*\"octob\" + 0.074*\"august\" + 0.073*\"juli\" + 0.071*\"januari\" + 0.070*\"april\" + 0.070*\"notion\" + 0.068*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:13:48,248 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 01:13:48,254 : INFO : topic diff=0.003504, rho=0.024434\n", + "2019-01-31 01:13:48,410 : INFO : PROGRESS: pass 0, at document #3352000/4922894\n", + "2019-01-31 01:13:49,792 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:50,059 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.074*\"august\" + 0.073*\"juli\" + 0.071*\"januari\" + 0.071*\"april\" + 0.070*\"notion\" + 0.068*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:13:50,060 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"horac\"\n", + "2019-01-31 01:13:50,061 : INFO : topic #22 (0.020): 0.036*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"trap\" + 0.007*\"feel\" + 0.007*\"incom\"\n", + "2019-01-31 01:13:50,062 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" 
+ 0.016*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 01:13:50,063 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.013*\"malaysia\"\n", + "2019-01-31 01:13:50,068 : INFO : topic diff=0.003759, rho=0.024427\n", + "2019-01-31 01:13:50,232 : INFO : PROGRESS: pass 0, at document #3354000/4922894\n", + "2019-01-31 01:13:51,646 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:51,912 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.013*\"czech\"\n", + "2019-01-31 01:13:51,914 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:13:51,915 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.022*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.014*\"novotná\" + 0.014*\"quebec\" + 0.014*\"misericordia\"\n", + "2019-01-31 01:13:51,916 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"love\"\n", + "2019-01-31 01:13:51,917 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:13:51,923 : INFO : topic diff=0.004306, rho=0.024419\n", + "2019-01-31 01:13:52,077 : INFO : PROGRESS: 
pass 0, at document #3356000/4922894\n", + "2019-01-31 01:13:53,442 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:53,709 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:13:53,710 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.014*\"rivièr\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:13:53,712 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:13:53,712 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.046*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:13:53,714 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.011*\"santa\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 01:13:53,720 : INFO : topic diff=0.003753, rho=0.024412\n", + "2019-01-31 01:13:53,936 : INFO : PROGRESS: pass 0, at document #3358000/4922894\n", + "2019-01-31 01:13:55,336 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:55,603 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.020*\"member\" + 0.017*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:13:55,604 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 
0.027*\"woman\" + 0.026*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"nation\"\n", + "2019-01-31 01:13:55,605 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"mean\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:13:55,606 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.048*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:13:55,607 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:13:55,613 : INFO : topic diff=0.003366, rho=0.024405\n", + "2019-01-31 01:13:58,339 : INFO : -11.800 per-word bound, 3565.4 perplexity estimate based on a held-out corpus of 2000 documents with 583734 words\n", + "2019-01-31 01:13:58,339 : INFO : PROGRESS: pass 0, at document #3360000/4922894\n", + "2019-01-31 01:13:59,730 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:13:59,997 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 01:13:59,998 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.017*\"player\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:13:59,999 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" 
+ 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:14:00,000 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:14:00,001 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:14:00,007 : INFO : topic diff=0.004039, rho=0.024398\n", + "2019-01-31 01:14:00,164 : INFO : PROGRESS: pass 0, at document #3362000/4922894\n", + "2019-01-31 01:14:01,541 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:01,808 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"task\" + 0.009*\"district\"\n", + "2019-01-31 01:14:01,809 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:14:01,810 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"like\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:14:01,812 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:14:01,813 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"develop\" + 0.010*\"organ\" + 0.009*\"commun\" + 
0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:14:01,818 : INFO : topic diff=0.003565, rho=0.024390\n", + "2019-01-31 01:14:01,973 : INFO : PROGRESS: pass 0, at document #3364000/4922894\n", + "2019-01-31 01:14:03,335 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:03,602 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:14:03,603 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.037*\"cotton\" + 0.036*\"tortur\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.021*\"multitud\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:14:03,604 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.009*\"task\" + 0.009*\"district\"\n", + "2019-01-31 01:14:03,605 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 01:14:03,606 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:14:03,612 : INFO : topic diff=0.003327, rho=0.024383\n", + "2019-01-31 01:14:03,777 : INFO : PROGRESS: pass 0, at document #3366000/4922894\n", + "2019-01-31 01:14:05,200 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:05,466 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 
0.042*\"line\" + 0.036*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"traceabl\" + 0.020*\"serv\" + 0.016*\"airmen\" + 0.015*\"rivièr\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:14:05,468 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:14:05,469 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.014*\"selma\" + 0.014*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 01:14:05,470 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:14:05,471 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.048*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:14:05,476 : INFO : topic diff=0.004753, rho=0.024376\n", + "2019-01-31 01:14:05,634 : INFO : PROGRESS: pass 0, at document #3368000/4922894\n", + "2019-01-31 01:14:07,017 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:07,284 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"gestur\"\n", + "2019-01-31 01:14:07,285 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:14:07,286 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 
0.021*\"rotterdam\" + 0.019*\"quarterli\" + 0.019*\"duke\" + 0.016*\"grammat\" + 0.016*\"idiosyncrat\" + 0.013*\"count\" + 0.013*\"portugues\" + 0.013*\"kingdom\"\n", + "2019-01-31 01:14:07,287 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:14:07,288 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.080*\"sens\" + 0.077*\"octob\" + 0.074*\"juli\" + 0.074*\"august\" + 0.072*\"januari\" + 0.071*\"april\" + 0.071*\"notion\" + 0.069*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:14:07,294 : INFO : topic diff=0.003514, rho=0.024369\n", + "2019-01-31 01:14:07,454 : INFO : PROGRESS: pass 0, at document #3370000/4922894\n", + "2019-01-31 01:14:08,846 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:09,113 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.020*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"lobe\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\"\n", + "2019-01-31 01:14:09,114 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:14:09,115 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"women\"\n", + "2019-01-31 01:14:09,116 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:14:09,117 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 
0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 01:14:09,123 : INFO : topic diff=0.003778, rho=0.024361\n", + "2019-01-31 01:14:09,282 : INFO : PROGRESS: pass 0, at document #3372000/4922894\n", + "2019-01-31 01:14:10,672 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:10,939 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:14:10,940 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:14:10,941 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.020*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"lobe\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\"\n", + "2019-01-31 01:14:10,942 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.009*\"horac\"\n", + "2019-01-31 01:14:10,943 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:14:10,949 : INFO : topic diff=0.004422, rho=0.024354\n", + "2019-01-31 01:14:11,108 : INFO : PROGRESS: pass 0, at document #3374000/4922894\n", + "2019-01-31 01:14:12,494 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:14:12,762 : INFO : topic #33 
(0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:14:12,763 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"gestur\"\n", + "2019-01-31 01:14:12,764 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 01:14:12,765 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:14:12,766 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.015*\"israel\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"jeremiah\" + 0.009*\"europ\"\n", + "2019-01-31 01:14:12,771 : INFO : topic diff=0.003743, rho=0.024347\n", + "2019-01-31 01:14:12,930 : INFO : PROGRESS: pass 0, at document #3376000/4922894\n", + "2019-01-31 01:14:14,316 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:14,582 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"utopian\"\n", + "2019-01-31 01:14:14,583 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:14:14,584 : INFO : topic #42 
(0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"jewish\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.015*\"israel\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"jeremiah\" + 0.009*\"europ\"\n", + "2019-01-31 01:14:14,585 : INFO : topic #13 (0.020): 0.030*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:14:14,586 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.044*\"american\" + 0.027*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.017*\"player\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:14:14,592 : INFO : topic diff=0.003603, rho=0.024340\n", + "2019-01-31 01:14:14,754 : INFO : PROGRESS: pass 0, at document #3378000/4922894\n", + "2019-01-31 01:14:16,156 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:16,423 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:14:16,424 : INFO : topic #44 (0.020): 0.033*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:14:16,425 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"have\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"acid\"\n", + "2019-01-31 01:14:16,426 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:14:16,427 : INFO : topic #22 (0.020): 
0.035*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" + 0.007*\"male\" + 0.007*\"trap\"\n", + "2019-01-31 01:14:16,433 : INFO : topic diff=0.003798, rho=0.024332\n", + "2019-01-31 01:14:19,119 : INFO : -11.591 per-word bound, 3084.6 perplexity estimate based on a held-out corpus of 2000 documents with 560510 words\n", + "2019-01-31 01:14:19,120 : INFO : PROGRESS: pass 0, at document #3380000/4922894\n", + "2019-01-31 01:14:20,491 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:20,758 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:14:20,759 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.015*\"swedish\" + 0.015*\"wind\" + 0.015*\"norwegian\" + 0.013*\"damag\" + 0.012*\"turkish\" + 0.012*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:14:20,760 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.030*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.010*\"affection\" + 0.009*\"khalsa\"\n", + "2019-01-31 01:14:20,761 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:14:20,762 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.007*\"championship\"\n", + "2019-01-31 01:14:20,768 : INFO : topic diff=0.003455, rho=0.024325\n", + "2019-01-31 01:14:20,923 : INFO : PROGRESS: pass 0, at document 
#3382000/4922894\n", + "2019-01-31 01:14:22,288 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:22,554 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.009*\"task\"\n", + "2019-01-31 01:14:22,555 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"feel\" + 0.007*\"incom\" + 0.007*\"trap\"\n", + "2019-01-31 01:14:22,556 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.010*\"televis\" + 0.010*\"alam\" + 0.009*\"affection\" + 0.009*\"sri\"\n", + "2019-01-31 01:14:22,557 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.043*\"canadian\" + 0.023*\"hoar\" + 0.022*\"toronto\" + 0.020*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.014*\"quebec\" + 0.014*\"misericordia\"\n", + "2019-01-31 01:14:22,558 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.014*\"arsen\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"magazin\" + 0.011*\"nicola\"\n", + "2019-01-31 01:14:22,564 : INFO : topic diff=0.003627, rho=0.024318\n", + "2019-01-31 01:14:22,717 : INFO : PROGRESS: pass 0, at document #3384000/4922894\n", + "2019-01-31 01:14:24,063 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:24,330 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"utopian\"\n", + "2019-01-31 01:14:24,331 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 
0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:14:24,332 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:14:24,333 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.026*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.021*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"nation\"\n", + "2019-01-31 01:14:24,334 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:14:24,339 : INFO : topic diff=0.003777, rho=0.024311\n", + "2019-01-31 01:14:24,499 : INFO : PROGRESS: pass 0, at document #3386000/4922894\n", + "2019-01-31 01:14:25,879 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:14:26,146 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"strategist\"\n", + "2019-01-31 01:14:26,147 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:14:26,148 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:14:26,149 : INFO : topic #40 
(0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:14:26,150 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.012*\"turkish\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:14:26,156 : INFO : topic diff=0.003653, rho=0.024304\n", + "2019-01-31 01:14:26,314 : INFO : PROGRESS: pass 0, at document #3388000/4922894\n", + "2019-01-31 01:14:27,699 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:27,965 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:14:27,966 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"wind\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.012*\"denmark\" + 0.012*\"turkish\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:14:27,967 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:14:27,968 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"noll\" + 0.022*\"japanes\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:14:27,969 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:14:27,975 : INFO 
: topic diff=0.004480, rho=0.024296\n", + "2019-01-31 01:14:28,191 : INFO : PROGRESS: pass 0, at document #3390000/4922894\n", + "2019-01-31 01:14:29,563 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:29,830 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.016*\"leah\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:14:29,831 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"championship\" + 0.007*\"includ\"\n", + "2019-01-31 01:14:29,832 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:14:29,833 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:14:29,834 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.031*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:14:29,840 : INFO : topic diff=0.003205, rho=0.024289\n", + "2019-01-31 01:14:29,998 : INFO : PROGRESS: pass 0, at document #3392000/4922894\n", + "2019-01-31 01:14:31,385 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:31,651 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.008*\"feel\" + 0.008*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 
01:14:31,652 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"utopian\"\n", + "2019-01-31 01:14:31,653 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:14:31,654 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"lobe\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\"\n", + "2019-01-31 01:14:31,655 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:14:31,661 : INFO : topic diff=0.003007, rho=0.024282\n", + "2019-01-31 01:14:31,824 : INFO : PROGRESS: pass 0, at document #3394000/4922894\n", + "2019-01-31 01:14:33,236 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:33,503 : INFO : topic #17 (0.020): 0.074*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.022*\"bishop\" + 0.018*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"poll\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:14:33,504 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:14:33,505 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.014*\"arsen\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"nicola\"\n", + 
"2019-01-31 01:14:33,506 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:14:33,507 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.016*\"leah\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:14:33,513 : INFO : topic diff=0.003557, rho=0.024275\n", + "2019-01-31 01:14:33,671 : INFO : PROGRESS: pass 0, at document #3396000/4922894\n", + "2019-01-31 01:14:35,053 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:35,319 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.078*\"octob\" + 0.073*\"august\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"april\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:14:35,320 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:14:35,321 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:14:35,322 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:14:35,323 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.016*\"leah\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.013*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:14:35,329 : INFO : 
topic diff=0.004078, rho=0.024268\n", + "2019-01-31 01:14:35,488 : INFO : PROGRESS: pass 0, at document #3398000/4922894\n", + "2019-01-31 01:14:36,873 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:37,140 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:14:37,141 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.043*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:14:37,141 : INFO : topic #13 (0.020): 0.029*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:14:37,143 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:14:37,144 : INFO : topic #7 (0.020): 0.020*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 01:14:37,149 : INFO : topic diff=0.003290, rho=0.024261\n", + "2019-01-31 01:14:39,862 : INFO : -11.825 per-word bound, 3627.0 perplexity estimate based on a held-out corpus of 2000 documents with 570130 words\n", + "2019-01-31 01:14:39,862 : INFO : PROGRESS: pass 0, at document #3400000/4922894\n", + "2019-01-31 01:14:41,247 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:41,514 : INFO : topic #49 
(0.020): 0.045*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"alam\" + 0.010*\"khalsa\" + 0.010*\"affection\" + 0.010*\"televis\"\n", + "2019-01-31 01:14:41,515 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:14:41,516 : INFO : topic #17 (0.020): 0.073*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"poll\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:14:41,517 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:14:41,518 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"acid\" + 0.006*\"treat\"\n", + "2019-01-31 01:14:41,524 : INFO : topic diff=0.003530, rho=0.024254\n", + "2019-01-31 01:14:41,683 : INFO : PROGRESS: pass 0, at document #3402000/4922894\n", + "2019-01-31 01:14:43,069 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:43,335 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:14:43,336 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:14:43,337 : INFO : topic #34 
(0.020): 0.069*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.031*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:14:43,338 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.022*\"arsen\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.018*\"museo\" + 0.014*\"colder\" + 0.013*\"gai\" + 0.013*\"black\" + 0.012*\"western\"\n", + "2019-01-31 01:14:43,339 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:14:43,345 : INFO : topic diff=0.003784, rho=0.024246\n", + "2019-01-31 01:14:43,505 : INFO : PROGRESS: pass 0, at document #3404000/4922894\n", + "2019-01-31 01:14:44,892 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:45,159 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.020*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.012*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:14:45,160 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.022*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.013*\"malaysia\"\n", + "2019-01-31 01:14:45,161 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:14:45,162 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:14:45,163 : INFO : topic #48 
(0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.078*\"octob\" + 0.073*\"august\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"april\" + 0.070*\"notion\" + 0.068*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:14:45,169 : INFO : topic diff=0.004525, rho=0.024239\n", + "2019-01-31 01:14:45,328 : INFO : PROGRESS: pass 0, at document #3406000/4922894\n", + "2019-01-31 01:14:46,731 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:46,998 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.014*\"arsen\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"nicola\"\n", + "2019-01-31 01:14:46,999 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:14:47,000 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.016*\"grammat\" + 0.014*\"count\" + 0.013*\"kingdom\" + 0.013*\"portugues\"\n", + "2019-01-31 01:14:47,001 : INFO : topic #13 (0.020): 0.029*\"australia\" + 0.027*\"london\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:14:47,002 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:14:47,008 : INFO : topic diff=0.003319, rho=0.024232\n", + "2019-01-31 01:14:47,162 : INFO : PROGRESS: pass 0, at document #3408000/4922894\n", + "2019-01-31 01:14:48,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 01:14:48,803 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.016*\"grammat\" + 0.014*\"count\" + 0.013*\"kingdom\" + 0.013*\"portugues\"\n", + "2019-01-31 01:14:48,804 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.031*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.011*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:14:48,805 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:14:48,806 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.023*\"nation\" + 0.020*\"member\" + 0.018*\"serv\" + 0.017*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:14:48,807 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:14:48,813 : INFO : topic diff=0.003191, rho=0.024225\n", + "2019-01-31 01:14:48,971 : INFO : PROGRESS: pass 0, at document #3410000/4922894\n", + "2019-01-31 01:14:50,362 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:50,628 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.011*\"airbu\" + 0.011*\"diversifi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:14:50,630 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.042*\"canadian\" + 0.023*\"hoar\" + 0.022*\"toronto\" + 0.019*\"ontario\" + 0.016*\"new\" + 
0.015*\"hydrogen\" + 0.014*\"novotná\" + 0.014*\"quebec\" + 0.014*\"misericordia\"\n", + "2019-01-31 01:14:50,631 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:14:50,632 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:14:50,633 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"lobe\" + 0.009*\"palmer\" + 0.009*\"land\"\n", + "2019-01-31 01:14:50,639 : INFO : topic diff=0.003742, rho=0.024218\n", + "2019-01-31 01:14:50,798 : INFO : PROGRESS: pass 0, at document #3412000/4922894\n", + "2019-01-31 01:14:52,205 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:52,471 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.048*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.016*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.013*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:14:52,472 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:14:52,473 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:14:52,474 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 
0.011*\"john\"\n", + "2019-01-31 01:14:52,475 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.007*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:14:52,481 : INFO : topic diff=0.003123, rho=0.024211\n", + "2019-01-31 01:14:52,643 : INFO : PROGRESS: pass 0, at document #3414000/4922894\n", + "2019-01-31 01:14:54,032 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:54,299 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.044*\"vigour\" + 0.044*\"popolo\" + 0.037*\"cotton\" + 0.036*\"tortur\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"multitud\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:14:54,300 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.020*\"rotterdam\" + 0.020*\"quarterli\" + 0.016*\"idiosyncrat\" + 0.016*\"grammat\" + 0.013*\"count\" + 0.013*\"kingdom\" + 0.013*\"portugues\"\n", + "2019-01-31 01:14:54,301 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 01:14:54,302 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:14:54,303 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.020*\"requir\" + 0.018*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:14:54,309 : INFO : topic diff=0.003516, rho=0.024204\n", + "2019-01-31 01:14:54,467 : INFO : PROGRESS: pass 0, at document #3416000/4922894\n", + "2019-01-31 01:14:55,860 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:14:56,126 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:14:56,128 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:14:56,129 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"televis\" + 0.011*\"alam\" + 0.010*\"khalsa\" + 0.009*\"affection\"\n", + "2019-01-31 01:14:56,130 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"diggin\" + 0.007*\"championship\"\n", + "2019-01-31 01:14:56,131 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 01:14:56,137 : INFO : topic diff=0.002914, rho=0.024197\n", + "2019-01-31 01:14:56,291 : INFO : PROGRESS: pass 0, at document #3418000/4922894\n", + "2019-01-31 01:14:57,652 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:14:57,921 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.013*\"report\" + 0.013*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 01:14:57,923 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 
0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:14:57,924 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.014*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:14:57,925 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 01:14:57,926 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.043*\"canadian\" + 0.023*\"hoar\" + 0.022*\"toronto\" + 0.020*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:14:57,932 : INFO : topic diff=0.003979, rho=0.024190\n", + "2019-01-31 01:15:00,656 : INFO : -11.625 per-word bound, 3157.7 perplexity estimate based on a held-out corpus of 2000 documents with 577054 words\n", + "2019-01-31 01:15:00,656 : INFO : PROGRESS: pass 0, at document #3420000/4922894\n", + "2019-01-31 01:15:02,051 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:02,317 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"fifteenth\" + 0.023*\"arsen\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.019*\"museo\" + 0.014*\"colder\" + 0.012*\"gai\" + 0.012*\"black\" + 0.012*\"western\"\n", + "2019-01-31 01:15:02,318 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.021*\"member\" + 0.017*\"polici\" + 0.016*\"republ\" + 0.013*\"report\" + 0.013*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 01:15:02,319 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:15:02,321 : INFO : topic #10 
(0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.006*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 01:15:02,322 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.015*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"champion\" + 0.010*\"squatter\"\n", + "2019-01-31 01:15:02,327 : INFO : topic diff=0.004008, rho=0.024183\n", + "2019-01-31 01:15:02,551 : INFO : PROGRESS: pass 0, at document #3422000/4922894\n", + "2019-01-31 01:15:03,979 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:04,246 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.020*\"quarterli\" + 0.019*\"rotterdam\" + 0.017*\"idiosyncrat\" + 0.016*\"grammat\" + 0.013*\"count\" + 0.013*\"kingdom\" + 0.013*\"portugues\"\n", + "2019-01-31 01:15:04,247 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:15:04,248 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"israel\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"isra\" + 0.009*\"europ\"\n", + "2019-01-31 01:15:04,249 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:15:04,250 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 0.006*\"workplac\" + 
0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:15:04,256 : INFO : topic diff=0.003858, rho=0.024175\n", + "2019-01-31 01:15:04,414 : INFO : PROGRESS: pass 0, at document #3424000/4922894\n", + "2019-01-31 01:15:05,807 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:06,073 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.014*\"arsen\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:15:06,074 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:15:06,075 : INFO : topic #13 (0.020): 0.029*\"australia\" + 0.027*\"london\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:15:06,076 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.025*\"schuster\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:15:06,077 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"march\" + 0.078*\"octob\" + 0.073*\"august\" + 0.073*\"juli\" + 0.073*\"januari\" + 0.070*\"april\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:15:06,083 : INFO : topic diff=0.003491, rho=0.024168\n", + "2019-01-31 01:15:06,239 : INFO : PROGRESS: pass 0, at document #3426000/4922894\n", + "2019-01-31 01:15:07,627 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:07,894 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 
0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:15:07,895 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"sweden\" + 0.016*\"wind\" + 0.015*\"norwai\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.013*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"turkish\"\n", + "2019-01-31 01:15:07,896 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.011*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:15:07,897 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:15:07,898 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:15:07,903 : INFO : topic diff=0.003325, rho=0.024161\n", + "2019-01-31 01:15:08,060 : INFO : PROGRESS: pass 0, at document #3428000/4922894\n", + "2019-01-31 01:15:09,449 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:09,716 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.007*\"disco\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 01:15:09,717 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"find\" + 0.012*\"fool\" + 0.010*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:15:09,718 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"genu\" + 0.011*\"plaisir\" + 0.009*\"monument\" + 0.008*\"biom\" + 0.008*\"feel\" + 
0.008*\"western\" + 0.008*\"male\" + 0.008*\"median\"\n", + "2019-01-31 01:15:09,719 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:15:09,720 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.044*\"american\" + 0.028*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.016*\"polit\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"wedg\"\n", + "2019-01-31 01:15:09,726 : INFO : topic diff=0.003611, rho=0.024154\n", + "2019-01-31 01:15:09,888 : INFO : PROGRESS: pass 0, at document #3430000/4922894\n", + "2019-01-31 01:15:11,293 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:11,563 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:15:11,564 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:15:11,565 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:15:11,566 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.044*\"vigour\" + 0.044*\"popolo\" + 0.036*\"cotton\" + 0.036*\"tortur\" + 0.022*\"adulthood\" + 0.022*\"area\" + 0.020*\"multitud\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:15:11,567 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.023*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" 
+ 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:15:11,573 : INFO : topic diff=0.003685, rho=0.024147\n", + "2019-01-31 01:15:11,728 : INFO : PROGRESS: pass 0, at document #3432000/4922894\n", + "2019-01-31 01:15:13,100 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:13,367 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.033*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:15:13,368 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:15:13,369 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:15:13,370 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.011*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:15:13,371 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 01:15:13,377 : INFO : topic diff=0.002838, rho=0.024140\n", + "2019-01-31 01:15:13,533 : INFO : PROGRESS: pass 0, at document #3434000/4922894\n", + "2019-01-31 01:15:14,906 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:15,173 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.007*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 
0.006*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:15:15,174 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:15:15,175 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:15:15,176 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:15:15,177 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:15:15,183 : INFO : topic diff=0.003527, rho=0.024133\n", + "2019-01-31 01:15:15,339 : INFO : PROGRESS: pass 0, at document #3436000/4922894\n", + "2019-01-31 01:15:16,726 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:16,993 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.015*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.010*\"champion\" + 0.010*\"squatter\"\n", + "2019-01-31 01:15:16,994 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"traceabl\" + 0.020*\"serv\" + 0.017*\"airmen\" + 0.017*\"rivièr\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:15:16,995 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" 
+ 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:15:16,996 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:15:16,997 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:15:17,003 : INFO : topic diff=0.003398, rho=0.024126\n", + "2019-01-31 01:15:17,163 : INFO : PROGRESS: pass 0, at document #3438000/4922894\n", + "2019-01-31 01:15:18,567 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:18,834 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:15:18,834 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"traceabl\" + 0.020*\"serv\" + 0.017*\"airmen\" + 0.017*\"rivièr\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:15:18,836 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:15:18,837 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"pathwai\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 01:15:18,838 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 
0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:15:18,844 : INFO : topic diff=0.003924, rho=0.024119\n", + "2019-01-31 01:15:21,498 : INFO : -11.858 per-word bound, 3712.3 perplexity estimate based on a held-out corpus of 2000 documents with 530854 words\n", + "2019-01-31 01:15:21,498 : INFO : PROGRESS: pass 0, at document #3440000/4922894\n", + "2019-01-31 01:15:22,880 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:23,147 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.013*\"palmer\" + 0.010*\"foam\" + 0.010*\"north\" + 0.010*\"nation\" + 0.009*\"sourc\"\n", + "2019-01-31 01:15:23,148 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.009*\"local\"\n", + "2019-01-31 01:15:23,149 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:15:23,150 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.079*\"march\" + 0.077*\"octob\" + 0.073*\"juli\" + 0.073*\"januari\" + 0.072*\"august\" + 0.071*\"april\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:15:23,151 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.024*\"sourc\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:15:23,157 : INFO : topic diff=0.003858, rho=0.024112\n", + "2019-01-31 01:15:23,316 : INFO : PROGRESS: pass 0, at document #3442000/4922894\n", + "2019-01-31 01:15:24,798 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:15:25,066 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.025*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:15:25,067 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:15:25,068 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"lizard\"\n", + "2019-01-31 01:15:25,070 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"arsen\" + 0.025*\"fifteenth\" + 0.020*\"museo\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.013*\"gai\" + 0.012*\"black\" + 0.011*\"western\"\n", + "2019-01-31 01:15:25,071 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.010*\"depress\"\n", + "2019-01-31 01:15:25,077 : INFO : topic diff=0.003395, rho=0.024105\n", + "2019-01-31 01:15:25,234 : INFO : PROGRESS: pass 0, at document #3444000/4922894\n", + "2019-01-31 01:15:26,618 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:26,885 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.031*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:15:26,886 : INFO : topic #27 (0.020): 0.069*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.015*\"ret\" + 0.014*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.010*\"champion\" + 
0.009*\"squatter\"\n", + "2019-01-31 01:15:26,887 : INFO : topic #45 (0.020): 0.027*\"jpg\" + 0.025*\"arsen\" + 0.025*\"fifteenth\" + 0.020*\"museo\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.013*\"gai\" + 0.012*\"black\" + 0.012*\"western\"\n", + "2019-01-31 01:15:26,888 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:15:26,890 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:15:26,896 : INFO : topic diff=0.003107, rho=0.024098\n", + "2019-01-31 01:15:27,051 : INFO : PROGRESS: pass 0, at document #3446000/4922894\n", + "2019-01-31 01:15:28,417 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:28,687 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.048*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"sourc\" + 0.015*\"leah\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:15:28,688 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"utopian\" + 0.006*\"théori\"\n", + "2019-01-31 01:15:28,689 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.026*\"arsen\" + 0.024*\"fifteenth\" + 0.020*\"museo\" + 0.019*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.013*\"gai\" + 0.012*\"black\" + 0.012*\"western\"\n", + "2019-01-31 01:15:28,690 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n" + ] + }, + { + "name": 
"stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:15:28,692 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.013*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"linear\" + 0.011*\"silicon\" + 0.010*\"depress\"\n", + "2019-01-31 01:15:28,698 : INFO : topic diff=0.003295, rho=0.024091\n", + "2019-01-31 01:15:28,852 : INFO : PROGRESS: pass 0, at document #3448000/4922894\n", + "2019-01-31 01:15:30,217 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:30,483 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.013*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:15:30,485 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:15:30,486 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.013*\"palmer\" + 0.010*\"north\" + 0.010*\"foam\" + 0.010*\"nation\" + 0.009*\"sourc\"\n", + "2019-01-31 01:15:30,487 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.010*\"reconstruct\"\n", + "2019-01-31 01:15:30,488 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:15:30,494 : INFO : topic diff=0.004371, rho=0.024084\n", + "2019-01-31 01:15:30,653 : INFO : PROGRESS: pass 0, at document #3450000/4922894\n", + "2019-01-31 01:15:32,045 : 
INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:32,311 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"sourc\" + 0.015*\"leah\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:15:32,312 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.008*\"class\"\n", + "2019-01-31 01:15:32,314 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:15:32,315 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:15:32,316 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.011*\"anglo\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.010*\"tajikistan\" + 0.010*\"alam\" + 0.010*\"affection\"\n", + "2019-01-31 01:15:32,322 : INFO : topic diff=0.003806, rho=0.024077\n", + "2019-01-31 01:15:32,479 : INFO : PROGRESS: pass 0, at document #3452000/4922894\n", + "2019-01-31 01:15:33,871 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:34,137 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:15:34,139 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 
0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:15:34,139 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"australian\" + 0.023*\"england\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:15:34,141 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 01:15:34,142 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:15:34,148 : INFO : topic diff=0.003816, rho=0.024070\n", + "2019-01-31 01:15:34,360 : INFO : PROGRESS: pass 0, at document #3454000/4922894\n", + "2019-01-31 01:15:35,746 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:36,013 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.013*\"palmer\" + 0.010*\"north\" + 0.010*\"nation\" + 0.009*\"foam\" + 0.009*\"sourc\"\n", + "2019-01-31 01:15:36,014 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.035*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"traceabl\" + 0.020*\"serv\" + 0.018*\"rivièr\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:15:36,016 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.018*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.010*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:15:36,017 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.032*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 
0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:15:36,018 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"republ\" + 0.017*\"polici\" + 0.014*\"report\" + 0.013*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 01:15:36,024 : INFO : topic diff=0.003505, rho=0.024063\n", + "2019-01-31 01:15:36,178 : INFO : PROGRESS: pass 0, at document #3456000/4922894\n", + "2019-01-31 01:15:37,556 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:37,823 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.010*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"storag\" + 0.007*\"appear\" + 0.006*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:15:37,824 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.031*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:15:37,825 : INFO : topic #45 (0.020): 0.026*\"jpg\" + 0.026*\"arsen\" + 0.024*\"fifteenth\" + 0.020*\"museo\" + 0.019*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.013*\"gai\" + 0.012*\"black\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:15:37,826 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"rivièr\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"silicon\" + 0.010*\"depress\"\n", + "2019-01-31 01:15:37,827 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.010*\"reconstruct\"\n", + "2019-01-31 01:15:37,833 : INFO : topic diff=0.003642, rho=0.024056\n", + "2019-01-31 01:15:37,991 : INFO : PROGRESS: pass 0, at document 
#3458000/4922894\n", + "2019-01-31 01:15:39,359 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:39,625 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:15:39,626 : INFO : topic #10 (0.020): 0.013*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.005*\"effect\"\n", + "2019-01-31 01:15:39,627 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.014*\"ret\" + 0.014*\"driver\" + 0.013*\"fool\" + 0.013*\"tornado\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:15:39,628 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.017*\"republ\" + 0.017*\"polici\" + 0.013*\"report\" + 0.013*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 01:15:39,629 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.032*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.022*\"noll\" + 0.020*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:15:39,635 : INFO : topic diff=0.003291, rho=0.024049\n", + "2019-01-31 01:15:42,283 : INFO : -11.556 per-word bound, 3010.0 perplexity estimate based on a held-out corpus of 2000 documents with 558121 words\n", + "2019-01-31 01:15:42,284 : INFO : PROGRESS: pass 0, at document #3460000/4922894\n", + "2019-01-31 01:15:43,645 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:43,912 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 
0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:15:43,913 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"utopian\"\n", + "2019-01-31 01:15:43,914 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.030*\"priest\" + 0.020*\"rotterdam\" + 0.019*\"duke\" + 0.019*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 01:15:43,915 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"sweden\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.013*\"damag\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"treeless\" + 0.010*\"denmark\"\n", + "2019-01-31 01:15:43,916 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.021*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"women\" + 0.013*\"chamber\"\n", + "2019-01-31 01:15:43,922 : INFO : topic diff=0.002954, rho=0.024042\n", + "2019-01-31 01:15:44,074 : INFO : PROGRESS: pass 0, at document #3462000/4922894\n", + "2019-01-31 01:15:45,414 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:45,681 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:15:45,682 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"utopian\" + 0.006*\"théori\"\n", + "2019-01-31 01:15:45,683 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.032*\"pari\" + 
0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:15:45,684 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:15:45,685 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:15:45,691 : INFO : topic diff=0.003354, rho=0.024035\n", + "2019-01-31 01:15:45,844 : INFO : PROGRESS: pass 0, at document #3464000/4922894\n", + "2019-01-31 01:15:47,193 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:47,459 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.031*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:15:47,460 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:15:47,461 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:15:47,462 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.044*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.019*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"wedg\"\n", + "2019-01-31 01:15:47,464 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" 
+ 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 01:15:47,470 : INFO : topic diff=0.003137, rho=0.024028\n", + "2019-01-31 01:15:47,630 : INFO : PROGRESS: pass 0, at document #3466000/4922894\n", + "2019-01-31 01:15:49,016 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:49,283 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:15:49,284 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"utopian\"\n", + "2019-01-31 01:15:49,285 : INFO : topic #24 (0.020): 0.037*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 01:15:49,286 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.014*\"bank\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:15:49,287 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.036*\"tortur\" + 0.036*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.020*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:15:49,293 : INFO : topic diff=0.004386, rho=0.024022\n", + "2019-01-31 01:15:49,454 : INFO : PROGRESS: pass 0, at document #3468000/4922894\n", + "2019-01-31 01:15:50,844 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:51,111 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 
0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:15:51,112 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.026*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"republ\" + 0.016*\"polici\" + 0.014*\"seaport\" + 0.014*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 01:15:51,113 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.010*\"reconstruct\"\n", + "2019-01-31 01:15:51,114 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.033*\"new\" + 0.032*\"unionist\" + 0.032*\"american\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:15:51,115 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:15:51,121 : INFO : topic diff=0.003418, rho=0.024015\n", + "2019-01-31 01:15:51,275 : INFO : PROGRESS: pass 0, at document #3470000/4922894\n", + "2019-01-31 01:15:52,616 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:52,882 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.048*\"franc\" + 0.032*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:15:52,883 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"utopian\"\n", + "2019-01-31 01:15:52,884 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 
0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.011*\"john\"\n", + "2019-01-31 01:15:52,885 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"nicola\"\n", + "2019-01-31 01:15:52,887 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.009*\"highli\"\n", + "2019-01-31 01:15:52,892 : INFO : topic diff=0.003855, rho=0.024008\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:15:53,051 : INFO : PROGRESS: pass 0, at document #3472000/4922894\n", + "2019-01-31 01:15:54,414 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:54,681 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.013*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"nation\" + 0.009*\"lobe\"\n", + "2019-01-31 01:15:54,682 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:15:54,683 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.008*\"bahá\"\n", + "2019-01-31 01:15:54,684 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"start\"\n", + "2019-01-31 01:15:54,685 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 
0.029*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"nicola\"\n", + "2019-01-31 01:15:54,691 : INFO : topic diff=0.003773, rho=0.024001\n", + "2019-01-31 01:15:54,843 : INFO : PROGRESS: pass 0, at document #3474000/4922894\n", + "2019-01-31 01:15:56,207 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:56,473 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.046*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.016*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:15:56,474 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:15:56,475 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.020*\"compos\" + 0.018*\"place\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:15:56,476 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:15:56,477 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:15:56,483 : INFO : topic diff=0.003531, rho=0.023994\n", + "2019-01-31 01:15:56,637 : INFO : PROGRESS: pass 0, at document #3476000/4922894\n", + "2019-01-31 01:15:58,000 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:15:58,266 : INFO : topic #32 (0.020): 0.050*\"district\" + 
0.045*\"vigour\" + 0.043*\"popolo\" + 0.036*\"tortur\" + 0.035*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:15:58,267 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:15:58,269 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.014*\"bank\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:15:58,270 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:15:58,271 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"rivièr\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"silicon\" + 0.010*\"depress\"\n", + "2019-01-31 01:15:58,276 : INFO : topic diff=0.003653, rho=0.023987\n", + "2019-01-31 01:15:58,436 : INFO : PROGRESS: pass 0, at document #3478000/4922894\n", + "2019-01-31 01:15:59,832 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:00,099 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.021*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:16:00,100 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"nicola\"\n", + "2019-01-31 01:16:00,101 : INFO : topic #14 (0.020): 0.024*\"forc\" + 
0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.011*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:16:00,102 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:16:00,104 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:16:00,109 : INFO : topic diff=0.004080, rho=0.023980\n", + "2019-01-31 01:16:02,859 : INFO : -11.986 per-word bound, 4057.6 perplexity estimate based on a held-out corpus of 2000 documents with 594242 words\n", + "2019-01-31 01:16:02,859 : INFO : PROGRESS: pass 0, at document #3480000/4922894\n", + "2019-01-31 01:16:04,257 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:04,523 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.032*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:16:04,525 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.014*\"bank\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:16:04,526 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.014*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:16:04,527 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 
0.017*\"idiosyncrat\" + 0.016*\"grammat\" + 0.015*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 01:16:04,528 : INFO : topic #45 (0.020): 0.027*\"arsen\" + 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.021*\"museo\" + 0.019*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.012*\"black\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:16:04,534 : INFO : topic diff=0.004051, rho=0.023973\n", + "2019-01-31 01:16:04,690 : INFO : PROGRESS: pass 0, at document #3482000/4922894\n", + "2019-01-31 01:16:06,044 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:06,310 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.019*\"place\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:16:06,311 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:16:06,312 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.018*\"hydrogen\" + 0.016*\"new\" + 0.015*\"novotná\" + 0.013*\"quebec\" + 0.013*\"misericordia\"\n", + "2019-01-31 01:16:06,313 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 01:16:06,314 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:16:06,320 : INFO : topic diff=0.003648, rho=0.023966\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + 
"text": [ + "2019-01-31 01:16:06,480 : INFO : PROGRESS: pass 0, at document #3484000/4922894\n", + "2019-01-31 01:16:07,871 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:08,137 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:16:08,138 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:16:08,139 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:16:08,141 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"teufel\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:16:08,142 : INFO : topic #31 (0.020): 0.049*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:16:08,148 : INFO : topic diff=0.003325, rho=0.023959\n", + "2019-01-31 01:16:08,304 : INFO : PROGRESS: pass 0, at document #3486000/4922894\n", + "2019-01-31 01:16:09,664 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:09,932 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:16:09,933 : INFO : topic #45 (0.020): 
0.027*\"arsen\" + 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.021*\"museo\" + 0.018*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.012*\"black\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:16:09,934 : INFO : topic #34 (0.020): 0.069*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.032*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:16:09,935 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"nicola\"\n", + "2019-01-31 01:16:09,936 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.008*\"legal\"\n", + "2019-01-31 01:16:09,943 : INFO : topic diff=0.003374, rho=0.023953\n", + "2019-01-31 01:16:10,164 : INFO : PROGRESS: pass 0, at document #3488000/4922894\n", + "2019-01-31 01:16:11,524 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:11,790 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.017*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:16:11,791 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:16:11,792 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:16:11,794 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 
0.012*\"genu\" + 0.012*\"plaisir\" + 0.009*\"western\" + 0.008*\"biom\" + 0.007*\"median\" + 0.007*\"feel\" + 0.007*\"male\" + 0.007*\"monument\"\n", + "2019-01-31 01:16:11,795 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:16:11,801 : INFO : topic diff=0.003362, rho=0.023946\n", + "2019-01-31 01:16:11,961 : INFO : PROGRESS: pass 0, at document #3490000/4922894\n", + "2019-01-31 01:16:13,341 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:13,608 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:16:13,609 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"magazin\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:16:13,610 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:16:13,611 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.036*\"tortur\" + 0.035*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:16:13,612 : INFO : topic #45 (0.020): 0.027*\"arsen\" + 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.021*\"museo\" + 0.018*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.012*\"exhaust\" + 0.012*\"black\"\n", + "2019-01-31 01:16:13,618 : INFO : topic diff=0.002982, rho=0.023939\n", + "2019-01-31 01:16:13,771 : INFO : PROGRESS: pass 
0, at document #3492000/4922894\n", + "2019-01-31 01:16:15,131 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:15,397 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"traceabl\" + 0.020*\"serv\" + 0.019*\"rivièr\" + 0.016*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:16:15,398 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.024*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:16:15,400 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.012*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"nation\" + 0.009*\"sourc\"\n", + "2019-01-31 01:16:15,401 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.012*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.010*\"silicon\" + 0.010*\"depress\"\n", + "2019-01-31 01:16:15,402 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:16:15,408 : INFO : topic diff=0.004041, rho=0.023932\n", + "2019-01-31 01:16:15,563 : INFO : PROGRESS: pass 0, at document #3494000/4922894\n", + "2019-01-31 01:16:16,925 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:17,191 : INFO : topic #47 (0.020): 0.060*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.018*\"place\" + 0.014*\"orchestr\" + 0.013*\"damn\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:16:17,192 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 
0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"john\"\n", + "2019-01-31 01:16:17,194 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"order\" + 0.008*\"legal\"\n", + "2019-01-31 01:16:17,195 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:16:17,196 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:16:17,201 : INFO : topic diff=0.004123, rho=0.023925\n", + "2019-01-31 01:16:17,362 : INFO : PROGRESS: pass 0, at document #3496000/4922894\n", + "2019-01-31 01:16:18,772 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:19,039 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.008*\"bahá\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:16:19,040 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.012*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"nation\" + 0.009*\"sourc\"\n", + "2019-01-31 01:16:19,041 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"pseudo\"\n", + "2019-01-31 01:16:19,043 : INFO : topic #24 (0.020): 
0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.013*\"arsen\" + 0.011*\"collect\" + 0.011*\"magazin\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:16:19,043 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"utopian\"\n", + "2019-01-31 01:16:19,049 : INFO : topic diff=0.004156, rho=0.023918\n", + "2019-01-31 01:16:19,208 : INFO : PROGRESS: pass 0, at document #3498000/4922894\n", + "2019-01-31 01:16:20,571 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:20,837 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:16:20,838 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:16:20,839 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.025*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.017*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:16:20,840 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.018*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:16:20,841 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"softwar\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"championship\" + 0.007*\"diggin\"\n", + "2019-01-31 01:16:20,847 : INFO : 
topic diff=0.003952, rho=0.023911\n", + "2019-01-31 01:16:23,506 : INFO : -11.620 per-word bound, 3147.9 perplexity estimate based on a held-out corpus of 2000 documents with 553231 words\n", + "2019-01-31 01:16:23,506 : INFO : PROGRESS: pass 0, at document #3500000/4922894\n", + "2019-01-31 01:16:24,876 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:25,142 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.008*\"bahá\"\n", + "2019-01-31 01:16:25,143 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.012*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"nation\" + 0.009*\"lobe\"\n", + "2019-01-31 01:16:25,145 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:16:25,146 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"bank\" + 0.012*\"million\" + 0.011*\"market\" + 0.010*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:16:25,147 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.019*\"candid\" + 0.019*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"fool\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.010*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 01:16:25,153 : INFO : topic diff=0.003629, rho=0.023905\n", + "2019-01-31 01:16:25,310 : INFO : PROGRESS: pass 0, at document #3502000/4922894\n", + "2019-01-31 01:16:26,679 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:26,945 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 
0.015*\"mount\" + 0.012*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"nation\" + 0.009*\"lobe\"\n", + "2019-01-31 01:16:26,946 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.045*\"american\" + 0.031*\"valour\" + 0.020*\"dutch\" + 0.019*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:16:26,948 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"rivièr\" + 0.011*\"constitut\" + 0.010*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"depress\"\n", + "2019-01-31 01:16:26,949 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:16:26,950 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"softwar\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"championship\" + 0.007*\"diggin\"\n", + "2019-01-31 01:16:26,956 : INFO : topic diff=0.003244, rho=0.023898\n", + "2019-01-31 01:16:27,110 : INFO : PROGRESS: pass 0, at document #3504000/4922894\n", + "2019-01-31 01:16:28,467 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:28,734 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.014*\"report\" + 0.013*\"bypass\"\n", + "2019-01-31 01:16:28,735 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.012*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"lobe\" + 0.009*\"sourc\"\n", + "2019-01-31 01:16:28,736 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 
0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"shirin\" + 0.015*\"sourc\" + 0.014*\"leah\" + 0.012*\"kim\"\n", + "2019-01-31 01:16:28,737 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:16:28,738 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:16:28,744 : INFO : topic diff=0.003516, rho=0.023891\n", + "2019-01-31 01:16:28,898 : INFO : PROGRESS: pass 0, at document #3506000/4922894\n", + "2019-01-31 01:16:30,236 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:30,502 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"shirin\" + 0.015*\"sourc\" + 0.014*\"leah\" + 0.012*\"kim\"\n", + "2019-01-31 01:16:30,503 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:16:30,504 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.019*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.012*\"palmer\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"lobe\"\n", + "2019-01-31 01:16:30,505 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:16:30,506 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.027*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 
0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:16:30,512 : INFO : topic diff=0.003585, rho=0.023884\n", + "2019-01-31 01:16:30,662 : INFO : PROGRESS: pass 0, at document #3508000/4922894\n", + "2019-01-31 01:16:31,974 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:32,243 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:16:32,244 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.028*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.010*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:16:32,245 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"softwar\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"championship\"\n", + "2019-01-31 01:16:32,246 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:16:32,247 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:16:32,253 : INFO : topic diff=0.004287, rho=0.023877\n", + "2019-01-31 01:16:32,412 : INFO : PROGRESS: pass 0, at document #3510000/4922894\n", + "2019-01-31 01:16:33,802 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:34,069 : INFO : topic #7 
(0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:16:34,070 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.009*\"biom\" + 0.007*\"median\" + 0.007*\"feel\" + 0.007*\"male\" + 0.007*\"monument\"\n", + "2019-01-31 01:16:34,071 : INFO : topic #48 (0.020): 0.080*\"sens\" + 0.079*\"march\" + 0.077*\"octob\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"august\" + 0.070*\"judici\" + 0.069*\"april\" + 0.069*\"notion\" + 0.066*\"decatur\"\n", + "2019-01-31 01:16:34,072 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.043*\"line\" + 0.033*\"raid\" + 0.028*\"rosenwald\" + 0.020*\"rivièr\" + 0.020*\"traceabl\" + 0.019*\"serv\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:16:34,073 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"till\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:16:34,079 : INFO : topic diff=0.003441, rho=0.023870\n", + "2019-01-31 01:16:34,238 : INFO : PROGRESS: pass 0, at document #3512000/4922894\n", + "2019-01-31 01:16:35,636 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:35,903 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.012*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:16:35,904 : INFO : topic #20 (0.020): 0.147*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"task\" + 0.010*\"district\" + 0.010*\"gothic\"\n", + "2019-01-31 01:16:35,905 : INFO : topic #42 (0.020): 
0.049*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:16:35,906 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:16:35,907 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.010*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:16:35,913 : INFO : topic diff=0.004478, rho=0.023864\n", + "2019-01-31 01:16:36,072 : INFO : PROGRESS: pass 0, at document #3514000/4922894\n", + "2019-01-31 01:16:37,452 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:37,718 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:16:37,719 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:16:37,720 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.030*\"priest\" + 0.020*\"rotterdam\" + 0.020*\"duke\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.016*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.013*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 01:16:37,722 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.009*\"man\" + 0.009*\"comic\" + 0.007*\"storag\" + 0.007*\"appear\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:16:37,723 : INFO : topic #18 (0.020): 0.011*\"théori\" + 
0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:16:37,729 : INFO : topic diff=0.003138, rho=0.023857\n", + "2019-01-31 01:16:37,885 : INFO : PROGRESS: pass 0, at document #3516000/4922894\n", + "2019-01-31 01:16:39,262 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:39,529 : INFO : topic #47 (0.020): 0.060*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.014*\"orchestr\" + 0.014*\"damn\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:16:39,530 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.033*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:16:39,531 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"bank\" + 0.012*\"million\" + 0.011*\"market\" + 0.010*\"produc\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"trace\"\n", + "2019-01-31 01:16:39,532 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"arsen\" + 0.011*\"collect\" + 0.011*\"magazin\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:16:39,534 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:16:39,540 : INFO : topic diff=0.003031, rho=0.023850\n", + "2019-01-31 01:16:39,760 : INFO : PROGRESS: pass 0, at document #3518000/4922894\n", + "2019-01-31 01:16:41,175 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:41,442 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 
0.040*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"task\" + 0.010*\"district\" + 0.010*\"gothic\"\n", + "2019-01-31 01:16:41,443 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.037*\"cotton\" + 0.035*\"tortur\" + 0.024*\"toni\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.021*\"area\" + 0.020*\"citi\"\n", + "2019-01-31 01:16:41,444 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:16:41,445 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.011*\"linear\" + 0.011*\"rivièr\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"silicon\" + 0.010*\"depress\"\n", + "2019-01-31 01:16:41,446 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:16:41,452 : INFO : topic diff=0.003552, rho=0.023843\n", + "2019-01-31 01:16:44,061 : INFO : -11.537 per-word bound, 2972.2 perplexity estimate based on a held-out corpus of 2000 documents with 552961 words\n", + "2019-01-31 01:16:44,061 : INFO : PROGRESS: pass 0, at document #3520000/4922894\n", + "2019-01-31 01:16:45,405 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:45,672 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:16:45,673 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 
0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:16:45,674 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:16:45,676 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"mexican\"\n", + "2019-01-31 01:16:45,677 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:16:45,683 : INFO : topic diff=0.004242, rho=0.023837\n", + "2019-01-31 01:16:45,837 : INFO : PROGRESS: pass 0, at document #3522000/4922894\n", + "2019-01-31 01:16:47,191 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:47,458 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.014*\"orchestr\" + 0.014*\"damn\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:16:47,459 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"bank\" + 0.012*\"million\" + 0.011*\"market\" + 0.010*\"produc\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"trace\"\n", + "2019-01-31 01:16:47,460 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.009*\"tajikistan\"\n", + "2019-01-31 01:16:47,461 : INFO : topic #3 (0.020): 0.033*\"present\" + 
0.025*\"offic\" + 0.025*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:16:47,462 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:16:47,468 : INFO : topic diff=0.003727, rho=0.023830\n", + "2019-01-31 01:16:47,625 : INFO : PROGRESS: pass 0, at document #3524000/4922894\n", + "2019-01-31 01:16:48,999 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:49,266 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.014*\"pakistan\" + 0.014*\"islam\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.009*\"affection\"\n", + "2019-01-31 01:16:49,267 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.025*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:16:49,268 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:16:49,269 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.005*\"utopian\"\n", + "2019-01-31 01:16:49,271 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"bank\" + 0.012*\"million\" + 0.011*\"market\" + 0.010*\"produc\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"trace\"\n", + "2019-01-31 01:16:49,277 : INFO : topic diff=0.003460, 
rho=0.023823\n", + "2019-01-31 01:16:49,437 : INFO : PROGRESS: pass 0, at document #3526000/4922894\n", + "2019-01-31 01:16:50,830 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:51,097 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:16:51,098 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:16:51,099 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.027*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:16:51,100 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:16:51,102 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.028*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.010*\"reconstruct\"\n", + "2019-01-31 01:16:51,107 : INFO : topic diff=0.003938, rho=0.023816\n", + "2019-01-31 01:16:51,268 : INFO : PROGRESS: pass 0, at document #3528000/4922894\n", + "2019-01-31 01:16:52,675 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:52,941 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.029*\"workplac\" + 0.027*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.021*\"event\" + 0.021*\"medal\" + 0.019*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 
01:16:52,942 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:16:52,943 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:16:52,945 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.014*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:16:52,946 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.028*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:16:52,952 : INFO : topic diff=0.003878, rho=0.023810\n", + "2019-01-31 01:16:53,108 : INFO : PROGRESS: pass 0, at document #3530000/4922894\n", + "2019-01-31 01:16:54,485 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:54,752 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.017*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"order\" + 0.009*\"polaris\" + 0.008*\"legal\"\n", + "2019-01-31 01:16:54,753 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.014*\"swedish\" + 0.014*\"damag\" + 0.013*\"wind\" + 0.012*\"norwegian\" + 0.012*\"denmark\" + 0.011*\"treeless\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:16:54,754 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.030*\"priest\" + 0.021*\"duke\" + 0.020*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.016*\"idiosyncrat\" + 0.015*\"kingdom\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + 
"2019-01-31 01:16:54,755 : INFO : topic #45 (0.020): 0.028*\"arsen\" + 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.021*\"museo\" + 0.019*\"illicit\" + 0.018*\"pain\" + 0.015*\"colder\" + 0.014*\"gai\" + 0.012*\"black\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:16:54,756 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"brio\"\n", + "2019-01-31 01:16:54,762 : INFO : topic diff=0.003643, rho=0.023803\n", + "2019-01-31 01:16:54,923 : INFO : PROGRESS: pass 0, at document #3532000/4922894\n", + "2019-01-31 01:16:56,329 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:56,596 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.036*\"cotton\" + 0.035*\"tortur\" + 0.022*\"toni\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.020*\"citi\"\n", + "2019-01-31 01:16:56,597 : INFO : topic #45 (0.020): 0.028*\"arsen\" + 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.021*\"museo\" + 0.019*\"illicit\" + 0.018*\"pain\" + 0.015*\"colder\" + 0.013*\"gai\" + 0.013*\"black\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:16:56,598 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.019*\"taxpay\" + 0.018*\"candid\" + 0.016*\"ret\" + 0.014*\"driver\" + 0.012*\"find\" + 0.012*\"fool\" + 0.011*\"tornado\" + 0.010*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:16:56,599 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.078*\"march\" + 0.076*\"octob\" + 0.071*\"juli\" + 0.069*\"august\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.067*\"april\" + 0.067*\"judici\" + 0.065*\"decatur\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:16:56,600 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 
0.020*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:16:56,605 : INFO : topic diff=0.004546, rho=0.023796\n", + "2019-01-31 01:16:56,762 : INFO : PROGRESS: pass 0, at document #3534000/4922894\n", + "2019-01-31 01:16:58,142 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:16:58,408 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.036*\"cotton\" + 0.035*\"tortur\" + 0.022*\"multitud\" + 0.022*\"toni\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.020*\"citi\"\n", + "2019-01-31 01:16:58,409 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.010*\"alam\" + 0.009*\"affection\"\n", + "2019-01-31 01:16:58,410 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.026*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:16:58,412 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.012*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:16:58,412 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.021*\"medal\" + 0.021*\"event\" + 0.019*\"atheist\" + 0.019*\"alic\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:16:58,418 : INFO : topic diff=0.003382, rho=0.023789\n", + "2019-01-31 01:16:58,572 : INFO : PROGRESS: pass 0, at document #3536000/4922894\n", + "2019-01-31 01:16:59,935 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:00,202 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 
0.020*\"ontario\" + 0.016*\"hydrogen\" + 0.016*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 01:17:00,203 : INFO : topic #45 (0.020): 0.029*\"arsen\" + 0.026*\"jpg\" + 0.024*\"fifteenth\" + 0.021*\"museo\" + 0.019*\"illicit\" + 0.019*\"pain\" + 0.015*\"colder\" + 0.014*\"gai\" + 0.013*\"black\" + 0.012*\"exhaust\"\n", + "2019-01-31 01:17:00,204 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.035*\"raid\" + 0.027*\"rosenwald\" + 0.022*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:00,205 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:17:00,206 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.024*\"personifi\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.015*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:17:00,212 : INFO : topic diff=0.003572, rho=0.023783\n", + "2019-01-31 01:17:00,370 : INFO : PROGRESS: pass 0, at document #3538000/4922894\n", + "2019-01-31 01:17:01,727 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:01,996 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:17:01,997 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.028*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:17:01,998 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 
0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 01:17:01,999 : INFO : topic #9 (0.020): 0.066*\"bone\" + 0.045*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:17:02,000 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:17:02,006 : INFO : topic diff=0.003498, rho=0.023776\n", + "2019-01-31 01:17:04,718 : INFO : -11.322 per-word bound, 2560.3 perplexity estimate based on a held-out corpus of 2000 documents with 561770 words\n", + "2019-01-31 01:17:04,718 : INFO : PROGRESS: pass 0, at document #3540000/4922894\n", + "2019-01-31 01:17:06,095 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:06,362 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:17:06,363 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.012*\"kim\"\n", + "2019-01-31 01:17:06,365 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:17:06,366 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"rivièr\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"briarwood\"\n", 
+ "2019-01-31 01:17:06,367 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:17:06,373 : INFO : topic diff=0.003522, rho=0.023769\n", + "2019-01-31 01:17:06,528 : INFO : PROGRESS: pass 0, at document #3542000/4922894\n", + "2019-01-31 01:17:08,316 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:08,586 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"mexican\"\n", + "2019-01-31 01:17:08,587 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.036*\"cotton\" + 0.036*\"tortur\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.021*\"toni\" + 0.020*\"citi\"\n", + "2019-01-31 01:17:08,588 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:17:08,589 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.015*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:17:08,590 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.014*\"swedish\" + 0.013*\"wind\" + 0.013*\"damag\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.012*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:17:08,596 : INFO : topic diff=0.003359, rho=0.023762\n", + "2019-01-31 01:17:08,754 : INFO : PROGRESS: pass 0, at document #3544000/4922894\n", + "2019-01-31 01:17:10,128 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:17:10,394 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.011*\"coalit\" + 0.011*\"pope\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:17:10,395 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:17:10,396 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:17:10,397 : INFO : topic #31 (0.020): 0.049*\"fusiform\" + 0.028*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:17:10,399 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:17:10,404 : INFO : topic diff=0.004090, rho=0.023756\n", + "2019-01-31 01:17:10,560 : INFO : PROGRESS: pass 0, at document #3546000/4922894\n", + "2019-01-31 01:17:11,904 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:12,170 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:17:12,172 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 
0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:17:12,173 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:17:12,174 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:17:12,175 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"feel\" + 0.007*\"male\" + 0.007*\"incom\"\n", + "2019-01-31 01:17:12,181 : INFO : topic diff=0.002942, rho=0.023749\n", + "2019-01-31 01:17:12,342 : INFO : PROGRESS: pass 0, at document #3548000/4922894\n", + "2019-01-31 01:17:13,745 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:14,011 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:17:14,012 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.031*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:17:14,014 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:17:14,015 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 
0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:17:14,016 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"vigour\" + 0.043*\"popolo\" + 0.036*\"cotton\" + 0.036*\"tortur\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.020*\"toni\" + 0.020*\"citi\"\n", + "2019-01-31 01:17:14,022 : INFO : topic diff=0.003812, rho=0.023742\n", + "2019-01-31 01:17:14,237 : INFO : PROGRESS: pass 0, at document #3550000/4922894\n", + "2019-01-31 01:17:15,642 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:15,908 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 0.027*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:15,910 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:17:15,911 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"rivièr\" + 0.010*\"silicon\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:17:15,912 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:15,913 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:17:15,919 : INFO : topic diff=0.003343, rho=0.023736\n", + "2019-01-31 01:17:16,074 : INFO : PROGRESS: pass 0, 
at document #3552000/4922894\n", + "2019-01-31 01:17:17,427 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:17,694 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 01:17:17,695 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:17,696 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.034*\"raid\" + 0.027*\"rosenwald\" + 0.025*\"rivièr\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:17,697 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.017*\"korean\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.014*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:17:17,698 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:17:17,704 : INFO : topic diff=0.004405, rho=0.023729\n", + "2019-01-31 01:17:17,857 : INFO : PROGRESS: pass 0, at document #3554000/4922894\n", + "2019-01-31 01:17:19,204 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:19,469 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:17:19,471 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 
0.007*\"southern\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:17:19,472 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"fleet\" + 0.008*\"bahá\"\n", + "2019-01-31 01:17:19,473 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.016*\"martin\" + 0.015*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:17:19,474 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:19,479 : INFO : topic diff=0.003399, rho=0.023722\n", + "2019-01-31 01:17:19,642 : INFO : PROGRESS: pass 0, at document #3556000/4922894\n", + "2019-01-31 01:17:21,015 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:21,282 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:17:21,283 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 01:17:21,284 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.016*\"misericordia\" + 0.014*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 01:17:21,285 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"offic\" + 0.025*\"nation\" + 
0.024*\"minist\" + 0.022*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:17:21,286 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.009*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:17:21,292 : INFO : topic diff=0.003774, rho=0.023716\n", + "2019-01-31 01:17:21,448 : INFO : PROGRESS: pass 0, at document #3558000/4922894\n", + "2019-01-31 01:17:22,801 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:23,068 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.031*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:17:23,069 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.029*\"priest\" + 0.021*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 0.017*\"idiosyncrat\" + 0.017*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.013*\"count\"\n", + "2019-01-31 01:17:23,070 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"rivièr\" + 0.010*\"briarwood\" + 0.010*\"silicon\"\n", + "2019-01-31 01:17:23,071 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.048*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:17:23,072 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.032*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.011*\"muskoge\" + 0.010*\"anglo\" + 0.010*\"khalsa\" + 0.010*\"televis\" + 0.010*\"affection\" + 0.010*\"alam\"\n", + "2019-01-31 01:17:23,078 : INFO : 
topic diff=0.003613, rho=0.023709\n", + "2019-01-31 01:17:25,756 : INFO : -11.688 per-word bound, 3299.6 perplexity estimate based on a held-out corpus of 2000 documents with 559634 words\n", + "2019-01-31 01:17:25,757 : INFO : PROGRESS: pass 0, at document #3560000/4922894\n", + "2019-01-31 01:17:27,133 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:27,399 : INFO : topic #28 (0.020): 0.033*\"build\" + 0.028*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"rivièr\" + 0.010*\"briarwood\" + 0.010*\"silicon\"\n", + "2019-01-31 01:17:27,400 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.024*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:27,401 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"poll\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:17:27,402 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.028*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:17:27,403 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 01:17:27,409 : INFO : topic diff=0.003368, rho=0.023702\n", + "2019-01-31 01:17:27,568 : INFO : PROGRESS: pass 0, at document #3562000/4922894\n", + "2019-01-31 01:17:28,936 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:29,202 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 
0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"john\"\n", + "2019-01-31 01:17:29,203 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:29,204 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.011*\"degre\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 01:17:29,205 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"district\" + 0.009*\"start\"\n", + "2019-01-31 01:17:29,206 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.033*\"raid\" + 0.026*\"rosenwald\" + 0.024*\"rivièr\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.016*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:29,212 : INFO : topic diff=0.003161, rho=0.023696\n", + "2019-01-31 01:17:29,369 : INFO : PROGRESS: pass 0, at document #3564000/4922894\n", + "2019-01-31 01:17:30,744 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:31,010 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"offic\" + 0.025*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:17:31,011 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"bank\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"trace\"\n", + "2019-01-31 01:17:31,012 : INFO : topic #11 (0.020): 0.024*\"john\" + 
0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:17:31,013 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.009*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:17:31,014 : INFO : topic #39 (0.020): 0.056*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.019*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 01:17:31,020 : INFO : topic diff=0.003937, rho=0.023689\n", + "2019-01-31 01:17:31,179 : INFO : PROGRESS: pass 0, at document #3566000/4922894\n", + "2019-01-31 01:17:32,550 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:32,818 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.010*\"district\" + 0.009*\"start\"\n", + "2019-01-31 01:17:32,819 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:17:32,820 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.020*\"korea\" + 0.018*\"shirin\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"leah\"\n", + "2019-01-31 01:17:32,821 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"march\" + 0.077*\"octob\" + 0.071*\"juli\" + 0.070*\"august\" + 0.069*\"judici\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.066*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:17:32,822 : INFO : topic #40 (0.020): 0.086*\"unit\" + 
0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.011*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:17:32,828 : INFO : topic diff=0.004484, rho=0.023682\n", + "2019-01-31 01:17:32,989 : INFO : PROGRESS: pass 0, at document #3568000/4922894\n", + "2019-01-31 01:17:34,395 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:34,661 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:17:34,662 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.028*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"arsen\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"magazin\"\n", + "2019-01-31 01:17:34,663 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:34,664 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"nation\" + 0.024*\"minist\" + 0.022*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:17:34,665 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.013*\"jewish\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:17:34,671 : INFO : topic diff=0.003744, rho=0.023676\n", + "2019-01-31 01:17:34,826 : INFO : PROGRESS: pass 0, at document #3570000/4922894\n", + "2019-01-31 01:17:36,186 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 01:17:36,452 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:17:36,453 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.017*\"women\" + 0.013*\"prison\"\n", + "2019-01-31 01:17:36,454 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:17:36,455 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.020*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:17:36,456 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"taxpay\" + 0.019*\"candid\" + 0.017*\"ret\" + 0.014*\"driver\" + 0.013*\"tornado\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.009*\"théori\"\n", + "2019-01-31 01:17:36,462 : INFO : topic diff=0.003084, rho=0.023669\n", + "2019-01-31 01:17:36,619 : INFO : PROGRESS: pass 0, at document #3572000/4922894\n", + "2019-01-31 01:17:37,992 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:38,259 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"poll\" + 0.010*\"historiographi\" + 0.010*\"cathedr\"\n", + "2019-01-31 01:17:38,260 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 
0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:17:38,261 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.022*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:17:38,263 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:17:38,263 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.022*\"hoar\" + 0.020*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 01:17:38,269 : INFO : topic diff=0.003464, rho=0.023662\n", + "2019-01-31 01:17:38,427 : INFO : PROGRESS: pass 0, at document #3574000/4922894\n", + "2019-01-31 01:17:39,799 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:40,065 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:17:40,066 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:17:40,067 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:17:40,068 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.033*\"raid\" + 0.026*\"rosenwald\" + 0.024*\"rivièr\" + 0.020*\"serv\" + 
0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:40,069 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:17:40,075 : INFO : topic diff=0.003328, rho=0.023656\n", + "2019-01-31 01:17:40,233 : INFO : PROGRESS: pass 0, at document #3576000/4922894\n", + "2019-01-31 01:17:41,618 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:41,886 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:17:41,887 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.024*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:17:41,888 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"district\" + 0.009*\"gothic\"\n", + "2019-01-31 01:17:41,889 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.009*\"have\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 01:17:41,890 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.028*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"briarwood\" + 0.010*\"rivièr\" + 0.010*\"silicon\"\n", + "2019-01-31 01:17:41,896 : INFO : topic diff=0.003590, rho=0.023649\n", + "2019-01-31 01:17:42,048 : INFO : PROGRESS: pass 0, at document #3578000/4922894\n", 
+ "2019-01-31 01:17:43,376 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:43,642 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:17:43,644 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.033*\"raid\" + 0.026*\"rosenwald\" + 0.024*\"rivièr\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:43,645 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:17:43,646 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.017*\"shirin\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"leah\"\n", + "2019-01-31 01:17:43,647 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.017*\"women\" + 0.013*\"prison\"\n", + "2019-01-31 01:17:43,652 : INFO : topic diff=0.003800, rho=0.023643\n", + "2019-01-31 01:17:46,409 : INFO : -11.569 per-word bound, 3037.9 perplexity estimate based on a held-out corpus of 2000 documents with 592364 words\n", + "2019-01-31 01:17:46,410 : INFO : PROGRESS: pass 0, at document #3580000/4922894\n", + "2019-01-31 01:17:47,817 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:48,083 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"district\" + 
0.009*\"start\"\n", + "2019-01-31 01:17:48,084 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:17:48,086 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.011*\"degre\" + 0.011*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:17:48,087 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:17:48,088 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"arsen\" + 0.011*\"magazin\" + 0.011*\"worldwid\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:17:48,094 : INFO : topic diff=0.003957, rho=0.023636\n", + "2019-01-31 01:17:48,250 : INFO : PROGRESS: pass 0, at document #3582000/4922894\n", + "2019-01-31 01:17:49,618 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:49,884 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:17:49,886 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:17:49,887 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.022*\"govern\" 
+ 0.020*\"member\" + 0.020*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:17:49,888 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"martin\" + 0.015*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:17:49,889 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.033*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.010*\"alam\" + 0.010*\"televis\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:17:49,894 : INFO : topic diff=0.003751, rho=0.023629\n", + "2019-01-31 01:17:50,111 : INFO : PROGRESS: pass 0, at document #3584000/4922894\n", + "2019-01-31 01:17:51,494 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:51,760 : INFO : topic #2 (0.020): 0.045*\"isl\" + 0.041*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"pope\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 01:17:51,761 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:17:51,763 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:17:51,764 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:17:51,765 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" 
+ 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:17:51,771 : INFO : topic diff=0.004011, rho=0.023623\n", + "2019-01-31 01:17:51,928 : INFO : PROGRESS: pass 0, at document #3586000/4922894\n", + "2019-01-31 01:17:53,300 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:53,567 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.016*\"taxpay\" + 0.015*\"tiepolo\" + 0.015*\"martin\" + 0.013*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:17:53,568 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:17:53,569 : INFO : topic #33 (0.020): 0.065*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.011*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:17:53,570 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:17:53,571 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:17:53,577 : INFO : topic diff=0.003633, rho=0.023616\n", + "2019-01-31 01:17:53,737 : INFO : PROGRESS: pass 0, at document #3588000/4922894\n", + "2019-01-31 01:17:55,153 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:55,419 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.024*\"reprint\" + 0.024*\"poison\" + 
0.023*\"personifi\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:17:55,420 : INFO : topic #33 (0.020): 0.065*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:17:55,421 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"palmer\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:17:55,422 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:17:55,423 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.011*\"order\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\"\n", + "2019-01-31 01:17:55,429 : INFO : topic diff=0.003215, rho=0.023610\n", + "2019-01-31 01:17:55,584 : INFO : PROGRESS: pass 0, at document #3590000/4922894\n", + "2019-01-31 01:17:56,951 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:57,217 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.013*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:17:57,219 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"jame\" + 0.012*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:17:57,220 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 
0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.006*\"modern\"\n", + "2019-01-31 01:17:57,221 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.032*\"raid\" + 0.026*\"rosenwald\" + 0.024*\"rivièr\" + 0.020*\"serv\" + 0.019*\"traceabl\" + 0.018*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:17:57,222 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.053*\"parti\" + 0.027*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:17:57,228 : INFO : topic diff=0.003583, rho=0.023603\n", + "2019-01-31 01:17:57,383 : INFO : PROGRESS: pass 0, at document #3592000/4922894\n", + "2019-01-31 01:17:58,750 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:17:59,017 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 01:17:59,018 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.006*\"modern\"\n", + "2019-01-31 01:17:59,019 : INFO : topic #9 (0.020): 0.067*\"bone\" + 0.045*\"american\" + 0.031*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:17:59,020 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"collect\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"arsen\"\n", + "2019-01-31 01:17:59,021 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.011*\"palmer\" + 
0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:17:59,027 : INFO : topic diff=0.004528, rho=0.023596\n", + "2019-01-31 01:17:59,184 : INFO : PROGRESS: pass 0, at document #3594000/4922894\n", + "2019-01-31 01:18:00,538 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:18:00,805 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"octob\" + 0.076*\"march\" + 0.070*\"juli\" + 0.069*\"august\" + 0.069*\"judici\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.066*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:18:00,806 : INFO : topic #45 (0.020): 0.032*\"arsen\" + 0.027*\"jpg\" + 0.026*\"museo\" + 0.025*\"fifteenth\" + 0.020*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.013*\"exhaust\" + 0.012*\"black\"\n", + "2019-01-31 01:18:00,807 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:18:00,808 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.018*\"festiv\" + 0.018*\"women\" + 0.018*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:18:00,809 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:18:00,815 : INFO : topic diff=0.003881, rho=0.023590\n", + "2019-01-31 01:18:00,970 : INFO : PROGRESS: pass 0, at document #3596000/4922894\n", + "2019-01-31 01:18:02,339 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:02,605 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"jame\" + 
0.012*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:18:02,606 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:18:02,607 : INFO : topic #31 (0.020): 0.053*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:18:02,609 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:18:02,610 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:18:02,615 : INFO : topic diff=0.003692, rho=0.023583\n", + "2019-01-31 01:18:02,773 : INFO : PROGRESS: pass 0, at document #3598000/4922894\n", + "2019-01-31 01:18:04,169 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:04,436 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"octob\" + 0.077*\"march\" + 0.071*\"juli\" + 0.069*\"august\" + 0.069*\"januari\" + 0.069*\"judici\" + 0.069*\"notion\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:18:04,437 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.025*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:18:04,438 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 
0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:18:04,439 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:18:04,440 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.009*\"have\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 01:18:04,446 : INFO : topic diff=0.004106, rho=0.023577\n", + "2019-01-31 01:18:07,101 : INFO : -11.619 per-word bound, 3144.9 perplexity estimate based on a held-out corpus of 2000 documents with 539947 words\n", + "2019-01-31 01:18:07,101 : INFO : PROGRESS: pass 0, at document #3600000/4922894\n", + "2019-01-31 01:18:08,462 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:08,728 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"octob\" + 0.077*\"march\" + 0.071*\"juli\" + 0.070*\"august\" + 0.069*\"notion\" + 0.069*\"januari\" + 0.069*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:18:08,730 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.047*\"vigour\" + 0.043*\"popolo\" + 0.036*\"cotton\" + 0.036*\"tortur\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.020*\"adulthood\" + 0.019*\"citi\" + 0.018*\"cede\"\n", + "2019-01-31 01:18:08,731 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.020*\"korea\" + 0.020*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"kim\" + 0.014*\"leah\"\n", + "2019-01-31 01:18:08,732 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" 
+ 0.006*\"effect\"\n", + "2019-01-31 01:18:08,733 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.016*\"new\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:18:08,739 : INFO : topic diff=0.003770, rho=0.023570\n", + "2019-01-31 01:18:08,899 : INFO : PROGRESS: pass 0, at document #3602000/4922894\n", + "2019-01-31 01:18:10,286 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:10,552 : INFO : topic #46 (0.020): 0.022*\"norwai\" + 0.019*\"stop\" + 0.016*\"sweden\" + 0.015*\"wind\" + 0.014*\"swedish\" + 0.013*\"norwegian\" + 0.013*\"huntsvil\" + 0.013*\"damag\" + 0.013*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:18:10,554 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:18:10,555 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"octob\" + 0.077*\"march\" + 0.071*\"juli\" + 0.070*\"august\" + 0.070*\"notion\" + 0.069*\"judici\" + 0.069*\"januari\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:18:10,556 : INFO : topic #45 (0.020): 0.033*\"arsen\" + 0.027*\"jpg\" + 0.025*\"museo\" + 0.025*\"fifteenth\" + 0.019*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.013*\"exhaust\" + 0.012*\"black\"\n", + "2019-01-31 01:18:10,557 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:18:10,563 : INFO : topic diff=0.003455, rho=0.023564\n", + "2019-01-31 01:18:10,715 : INFO : PROGRESS: pass 0, at document #3604000/4922894\n", + "2019-01-31 01:18:12,053 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:18:12,319 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:18:12,320 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.024*\"kong\" + 0.023*\"hong\" + 0.020*\"korea\" + 0.020*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.014*\"kim\" + 0.014*\"leah\"\n", + "2019-01-31 01:18:12,321 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:18:12,323 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.014*\"republ\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:18:12,324 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.019*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:18:12,329 : INFO : topic diff=0.003178, rho=0.023557\n", + "2019-01-31 01:18:12,487 : INFO : PROGRESS: pass 0, at document #3606000/4922894\n", + "2019-01-31 01:18:13,879 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:14,146 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.006*\"ancestor\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:18:14,147 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 
0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"palmer\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:18:14,148 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:18:14,149 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:18:14,150 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:18:14,156 : INFO : topic diff=0.003445, rho=0.023551\n", + "2019-01-31 01:18:14,310 : INFO : PROGRESS: pass 0, at document #3608000/4922894\n", + "2019-01-31 01:18:15,673 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:15,939 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:18:15,941 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.009*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:18:15,942 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:18:15,943 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.008*\"hormon\" 
+ 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:18:15,944 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:18:15,950 : INFO : topic diff=0.004031, rho=0.023544\n", + "2019-01-31 01:18:16,104 : INFO : PROGRESS: pass 0, at document #3610000/4922894\n", + "2019-01-31 01:18:17,465 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:17,732 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.007*\"summerhil\"\n", + "2019-01-31 01:18:17,733 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.033*\"publicis\" + 0.029*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:18:17,734 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.010*\"itali\"\n", + "2019-01-31 01:18:17,735 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"islam\" + 0.011*\"muskoge\" + 0.011*\"affection\" + 0.010*\"sri\" + 0.010*\"anglo\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:18:17,736 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"taxpay\" + 0.020*\"candid\" + 0.017*\"ret\" + 0.014*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"horac\"\n", + "2019-01-31 01:18:17,742 : INFO : topic diff=0.003085, rho=0.023538\n", + "2019-01-31 01:18:17,897 : INFO : PROGRESS: pass 0, at document #3612000/4922894\n", + 
"2019-01-31 01:18:19,261 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:19,528 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:18:19,529 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"palmer\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\"\n", + "2019-01-31 01:18:19,530 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:18:19,531 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:18:19,532 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.019*\"alic\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:18:19,538 : INFO : topic diff=0.003891, rho=0.023531\n", + "2019-01-31 01:18:19,759 : INFO : PROGRESS: pass 0, at document #3614000/4922894\n", + "2019-01-31 01:18:21,167 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:21,434 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.009*\"local\"\n", + "2019-01-31 01:18:21,435 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 
0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"championship\" + 0.008*\"uruguayan\"\n", + "2019-01-31 01:18:21,436 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"jack\"\n", + "2019-01-31 01:18:21,437 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.018*\"rainfal\" + 0.018*\"alic\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:18:21,438 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"kim\" + 0.013*\"leah\"\n", + "2019-01-31 01:18:21,444 : INFO : topic diff=0.003763, rho=0.023525\n", + "2019-01-31 01:18:21,604 : INFO : PROGRESS: pass 0, at document #3616000/4922894\n", + "2019-01-31 01:18:23,001 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:23,267 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.024*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.015*\"kim\" + 0.013*\"leah\"\n", + "2019-01-31 01:18:23,268 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.019*\"alic\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:18:23,269 : INFO : topic #16 (0.020): 0.060*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.020*\"quarterli\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.016*\"grammat\" + 0.013*\"count\" + 0.013*\"kingdom\" + 0.013*\"brazil\"\n", + "2019-01-31 01:18:23,270 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.043*\"line\" + 0.032*\"raid\" + 0.026*\"rosenwald\" + 0.023*\"rivièr\" + 0.019*\"serv\" + 
0.019*\"traceabl\" + 0.018*\"airmen\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:18:23,271 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"jack\"\n", + "2019-01-31 01:18:23,277 : INFO : topic diff=0.003321, rho=0.023518\n", + "2019-01-31 01:18:23,432 : INFO : PROGRESS: pass 0, at document #3618000/4922894\n", + "2019-01-31 01:18:24,794 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:25,061 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:18:25,062 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"josé\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:18:25,063 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:18:25,064 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.017*\"vol\" + 0.014*\"der\" + 0.013*\"israel\" + 0.013*\"jewish\" + 0.013*\"berlin\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:18:25,065 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:18:25,071 : INFO : topic diff=0.003761, rho=0.023512\n", + "2019-01-31 
01:18:27,659 : INFO : -11.642 per-word bound, 3196.0 perplexity estimate based on a held-out corpus of 2000 documents with 499041 words\n", + "2019-01-31 01:18:27,659 : INFO : PROGRESS: pass 0, at document #3620000/4922894\n", + "2019-01-31 01:18:29,011 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:29,277 : INFO : topic #2 (0.020): 0.047*\"isl\" + 0.040*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"blur\" + 0.011*\"pope\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 01:18:29,279 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.009*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:18:29,280 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.029*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"pistol\"\n", + "2019-01-31 01:18:29,281 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:18:29,282 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:18:29,288 : INFO : topic diff=0.004018, rho=0.023505\n", + "2019-01-31 01:18:29,448 : INFO : PROGRESS: pass 0, at document #3622000/4922894\n", + "2019-01-31 01:18:30,847 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:31,114 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"muskoge\" + 
0.012*\"anglo\" + 0.011*\"affection\" + 0.010*\"sri\" + 0.010*\"televis\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:18:31,115 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.010*\"carlo\" + 0.010*\"itali\"\n", + "2019-01-31 01:18:31,116 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.024*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.016*\"shirin\" + 0.014*\"kim\" + 0.013*\"leah\"\n", + "2019-01-31 01:18:31,117 : INFO : topic #46 (0.020): 0.021*\"norwai\" + 0.018*\"stop\" + 0.017*\"sweden\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"denmark\" + 0.012*\"huntsvil\" + 0.012*\"damag\" + 0.011*\"treeless\"\n", + "2019-01-31 01:18:31,118 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.010*\"gothic\" + 0.009*\"district\"\n", + "2019-01-31 01:18:31,124 : INFO : topic diff=0.003610, rho=0.023499\n", + "2019-01-31 01:18:31,284 : INFO : PROGRESS: pass 0, at document #3624000/4922894\n", + "2019-01-31 01:18:32,676 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:32,943 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.024*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:18:32,944 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.017*\"vol\" + 0.014*\"der\" + 0.013*\"berlin\" + 0.013*\"jewish\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:18:32,945 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 
0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:18:32,946 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"taxpay\" + 0.020*\"candid\" + 0.016*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"horac\"\n", + "2019-01-31 01:18:32,947 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:18:32,953 : INFO : topic diff=0.004570, rho=0.023492\n", + "2019-01-31 01:18:33,112 : INFO : PROGRESS: pass 0, at document #3626000/4922894\n", + "2019-01-31 01:18:34,497 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:34,762 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.026*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:18:34,764 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"pour\" + 0.015*\"depress\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"candid\"\n", + "2019-01-31 01:18:34,765 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.020*\"ontario\" + 0.016*\"hydrogen\" + 0.016*\"new\" + 0.015*\"misericordia\" + 0.013*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:18:34,766 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:18:34,767 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 
0.009*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:18:34,773 : INFO : topic diff=0.004066, rho=0.023486\n", + "2019-01-31 01:18:34,925 : INFO : PROGRESS: pass 0, at document #3628000/4922894\n", + "2019-01-31 01:18:36,264 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:36,530 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:18:36,531 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.036*\"cotton\" + 0.036*\"tortur\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:18:36,532 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"dai\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.009*\"local\"\n", + "2019-01-31 01:18:36,533 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:18:36,534 : INFO : topic #44 (0.020): 0.032*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 01:18:36,540 : INFO : topic diff=0.003929, rho=0.023479\n", + "2019-01-31 01:18:36,700 : INFO : PROGRESS: pass 0, at document #3630000/4922894\n", + "2019-01-31 01:18:38,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:38,354 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.030*\"unionist\" + 
0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.011*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:18:38,355 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:18:38,356 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.010*\"itali\"\n", + "2019-01-31 01:18:38,358 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:18:38,359 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:18:38,364 : INFO : topic diff=0.003398, rho=0.023473\n", + "2019-01-31 01:18:38,518 : INFO : PROGRESS: pass 0, at document #3632000/4922894\n", + "2019-01-31 01:18:39,874 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:40,140 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.047*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"piec\" + 0.012*\"loui\" + 0.008*\"wine\"\n", + "2019-01-31 01:18:40,141 : INFO : topic #16 (0.020): 0.060*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.020*\"quarterli\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.016*\"grammat\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.013*\"portugues\"\n", + "2019-01-31 01:18:40,142 : INFO : topic #48 (0.020): 0.086*\"sens\" + 
0.081*\"octob\" + 0.079*\"march\" + 0.069*\"juli\" + 0.069*\"august\" + 0.068*\"januari\" + 0.067*\"notion\" + 0.067*\"judici\" + 0.065*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:18:40,143 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"order\" + 0.009*\"polaris\" + 0.008*\"legal\"\n", + "2019-01-31 01:18:40,144 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.018*\"women\" + 0.013*\"prison\"\n", + "2019-01-31 01:18:40,150 : INFO : topic diff=0.003796, rho=0.023466\n", + "2019-01-31 01:18:40,304 : INFO : PROGRESS: pass 0, at document #3634000/4922894\n", + "2019-01-31 01:18:41,676 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:41,942 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.012*\"crayfish\" + 0.010*\"north\" + 0.010*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:18:41,943 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.009*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:18:41,944 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.019*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:18:41,945 : INFO : topic #21 (0.020): 0.032*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.010*\"itali\"\n", + "2019-01-31 01:18:41,946 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" 
+ 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"order\" + 0.009*\"polaris\" + 0.008*\"legal\"\n", + "2019-01-31 01:18:41,952 : INFO : topic diff=0.003579, rho=0.023460\n", + "2019-01-31 01:18:42,102 : INFO : PROGRESS: pass 0, at document #3636000/4922894\n", + "2019-01-31 01:18:43,429 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:43,696 : INFO : topic #17 (0.020): 0.075*\"church\" + 0.024*\"christian\" + 0.023*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:18:43,697 : INFO : topic #46 (0.020): 0.021*\"norwai\" + 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.013*\"denmark\" + 0.012*\"huntsvil\" + 0.012*\"damag\" + 0.011*\"treeless\"\n", + "2019-01-31 01:18:43,698 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:18:43,699 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"shirin\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"leah\"\n", + "2019-01-31 01:18:43,700 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"england\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:18:43,706 : INFO : topic diff=0.003809, rho=0.023453\n", + "2019-01-31 01:18:43,861 : INFO : PROGRESS: pass 0, at document #3638000/4922894\n", + "2019-01-31 01:18:45,223 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:45,490 : INFO : topic #41 (0.020): 0.039*\"citi\" + 
0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.014*\"open\" + 0.012*\"center\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"local\"\n", + "2019-01-31 01:18:45,491 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"england\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:18:45,492 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:18:45,493 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"candid\"\n", + "2019-01-31 01:18:45,494 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.024*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"shirin\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"leah\"\n", + "2019-01-31 01:18:45,500 : INFO : topic diff=0.003342, rho=0.023447\n", + "2019-01-31 01:18:48,089 : INFO : -12.147 per-word bound, 4534.6 perplexity estimate based on a held-out corpus of 2000 documents with 528573 words\n", + "2019-01-31 01:18:48,090 : INFO : PROGRESS: pass 0, at document #3640000/4922894\n", + "2019-01-31 01:18:49,435 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:49,701 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 01:18:49,702 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"england\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.022*\"australian\" + 
0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:18:49,703 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:18:49,704 : INFO : topic #45 (0.020): 0.033*\"arsen\" + 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.025*\"museo\" + 0.019*\"pain\" + 0.018*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.013*\"exhaust\" + 0.011*\"black\"\n", + "2019-01-31 01:18:49,705 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:18:49,711 : INFO : topic diff=0.004051, rho=0.023440\n", + "2019-01-31 01:18:49,872 : INFO : PROGRESS: pass 0, at document #3642000/4922894\n", + "2019-01-31 01:18:51,266 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:51,532 : INFO : topic #46 (0.020): 0.020*\"norwai\" + 0.018*\"stop\" + 0.017*\"sweden\" + 0.015*\"swedish\" + 0.015*\"damag\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.013*\"huntsvil\" + 0.012*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:18:51,533 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.010*\"horac\"\n", + "2019-01-31 01:18:51,535 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:18:51,536 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.024*\"kong\" + 
0.023*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"shirin\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"leah\"\n", + "2019-01-31 01:18:51,537 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:18:51,542 : INFO : topic diff=0.003584, rho=0.023434\n", + "2019-01-31 01:18:51,700 : INFO : PROGRESS: pass 0, at document #3644000/4922894\n", + "2019-01-31 01:18:53,084 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:53,350 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:18:53,351 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.044*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.016*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 01:18:53,352 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.012*\"crayfish\" + 0.010*\"north\" + 0.010*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:18:53,353 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"taxpay\" + 0.018*\"rainfal\" + 0.018*\"alic\"\n", + "2019-01-31 01:18:53,354 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.037*\"rural\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:18:53,360 : INFO : topic diff=0.003571, rho=0.023427\n", + "2019-01-31 01:18:53,586 : INFO 
: PROGRESS: pass 0, at document #3646000/4922894\n", + "2019-01-31 01:18:54,995 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:55,261 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.035*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:18:55,263 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:18:55,264 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.042*\"line\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.024*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.018*\"airmen\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:18:55,265 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:18:55,266 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:18:55,272 : INFO : topic diff=0.004159, rho=0.023421\n", + "2019-01-31 01:18:55,426 : INFO : PROGRESS: pass 0, at document #3648000/4922894\n", + "2019-01-31 01:18:56,772 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:57,038 : INFO : topic #33 (0.020): 0.064*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"piec\" + 0.011*\"loui\" + 0.008*\"wine\"\n", + "2019-01-31 01:18:57,039 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.024*\"palmer\" + 
0.020*\"new\" + 0.017*\"strategist\" + 0.014*\"open\" + 0.012*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:18:57,040 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.029*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"open\"\n", + "2019-01-31 01:18:57,042 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"word\"\n", + "2019-01-31 01:18:57,043 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.016*\"grammat\" + 0.013*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 01:18:57,048 : INFO : topic diff=0.003302, rho=0.023415\n", + "2019-01-31 01:18:57,200 : INFO : PROGRESS: pass 0, at document #3650000/4922894\n", + "2019-01-31 01:18:58,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:18:58,809 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:18:58,810 : INFO : topic #46 (0.020): 0.020*\"norwai\" + 0.018*\"stop\" + 0.017*\"sweden\" + 0.015*\"damag\" + 0.015*\"swedish\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.013*\"huntsvil\" + 0.012*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:18:58,811 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 01:18:58,812 : INFO : topic #15 (0.020): 0.011*\"small\" + 
0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:18:58,813 : INFO : topic #33 (0.020): 0.063*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"piec\" + 0.011*\"loui\" + 0.008*\"wine\"\n", + "2019-01-31 01:18:58,819 : INFO : topic diff=0.003907, rho=0.023408\n", + "2019-01-31 01:18:58,971 : INFO : PROGRESS: pass 0, at document #3652000/4922894\n", + "2019-01-31 01:19:00,332 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:00,599 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.011*\"sri\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:19:00,600 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:19:00,601 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:19:00,602 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:19:00,603 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:19:00,609 : INFO : topic diff=0.003376, rho=0.023402\n", + "2019-01-31 
01:19:00,763 : INFO : PROGRESS: pass 0, at document #3654000/4922894\n", + "2019-01-31 01:19:02,132 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:02,399 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:19:02,400 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"england\" + 0.025*\"london\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:19:02,401 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.046*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.018*\"english\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:19:02,402 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:19:02,403 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:19:02,409 : INFO : topic diff=0.003231, rho=0.023395\n", + "2019-01-31 01:19:02,567 : INFO : PROGRESS: pass 0, at document #3656000/4922894\n", + "2019-01-31 01:19:03,944 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:04,211 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 
0.011*\"citi\"\n", + "2019-01-31 01:19:04,212 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 01:19:04,213 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:19:04,214 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.017*\"vol\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.010*\"european\" + 0.009*\"europ\" + 0.008*\"austria\"\n", + "2019-01-31 01:19:04,215 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.016*\"seaport\" + 0.014*\"bypass\" + 0.014*\"republ\" + 0.013*\"report\"\n", + "2019-01-31 01:19:04,221 : INFO : topic diff=0.003621, rho=0.023389\n", + "2019-01-31 01:19:04,380 : INFO : PROGRESS: pass 0, at document #3658000/4922894\n", + "2019-01-31 01:19:05,763 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:06,029 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.018*\"women\" + 0.013*\"prison\"\n", + "2019-01-31 01:19:06,031 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.046*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.035*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:19:06,032 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.012*\"crayfish\" + 0.010*\"north\" + 0.010*\"palmer\" + 0.009*\"sourc\" + 
0.009*\"land\"\n", + "2019-01-31 01:19:06,033 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.036*\"rural\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:19:06,034 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.009*\"replac\" + 0.009*\"polaris\" + 0.009*\"order\" + 0.008*\"legal\"\n", + "2019-01-31 01:19:06,039 : INFO : topic diff=0.003983, rho=0.023383\n", + "2019-01-31 01:19:08,709 : INFO : -11.769 per-word bound, 3489.8 perplexity estimate based on a held-out corpus of 2000 documents with 550710 words\n", + "2019-01-31 01:19:08,709 : INFO : PROGRESS: pass 0, at document #3660000/4922894\n", + "2019-01-31 01:19:10,078 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:10,345 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"muskoge\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.011*\"sri\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:19:10,346 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:19:10,347 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"woman\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:19:10,348 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:19:10,349 : INFO : topic #21 (0.020): 
0.034*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.012*\"juan\" + 0.011*\"carlo\" + 0.010*\"mexican\"\n", + "2019-01-31 01:19:10,355 : INFO : topic diff=0.003735, rho=0.023376\n", + "2019-01-31 01:19:10,509 : INFO : PROGRESS: pass 0, at document #3662000/4922894\n", + "2019-01-31 01:19:11,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:12,143 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.024*\"london\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:19:12,144 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"order\" + 0.008*\"legal\"\n", + "2019-01-31 01:19:12,145 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:19:12,146 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"championship\"\n", + "2019-01-31 01:19:12,147 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:19:12,153 : INFO : topic diff=0.003019, rho=0.023370\n", + "2019-01-31 01:19:12,310 : INFO : PROGRESS: pass 0, at document #3664000/4922894\n", + "2019-01-31 01:19:13,675 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:13,941 : INFO : topic 
#18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:19:13,942 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"rural\" + 0.036*\"sovereignti\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:19:13,943 : INFO : topic #31 (0.020): 0.055*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:19:13,944 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.041*\"line\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.018*\"airmen\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:19:13,945 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"count\"\n", + "2019-01-31 01:19:13,951 : INFO : topic diff=0.004015, rho=0.023363\n", + "2019-01-31 01:19:14,102 : INFO : PROGRESS: pass 0, at document #3666000/4922894\n", + "2019-01-31 01:19:15,425 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:15,692 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.032*\"priest\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"count\"\n", + "2019-01-31 01:19:15,693 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:19:15,694 
: INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.038*\"tortur\" + 0.035*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"citi\" + 0.019*\"cede\"\n", + "2019-01-31 01:19:15,695 : INFO : topic #0 (0.020): 0.068*\"statewid\" + 0.041*\"line\" + 0.031*\"raid\" + 0.025*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.018*\"airmen\" + 0.013*\"oper\" + 0.010*\"transient\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:19:15,696 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.011*\"dai\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.009*\"local\"\n", + "2019-01-31 01:19:15,703 : INFO : topic diff=0.004083, rho=0.023357\n", + "2019-01-31 01:19:15,859 : INFO : PROGRESS: pass 0, at document #3668000/4922894\n", + "2019-01-31 01:19:17,232 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:17,498 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:19:17,500 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 01:19:17,501 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:19:17,502 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 
0.018*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:19:17,503 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.011*\"pope\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.008*\"bahá\"\n", + "2019-01-31 01:19:17,509 : INFO : topic diff=0.003578, rho=0.023351\n", + "2019-01-31 01:19:17,663 : INFO : PROGRESS: pass 0, at document #3670000/4922894\n", + "2019-01-31 01:19:19,015 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:19,282 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:19:19,283 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 01:19:19,284 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:19:19,285 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:19:19,286 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:19:19,292 : INFO : topic diff=0.002792, rho=0.023344\n", + "2019-01-31 01:19:19,449 : INFO : PROGRESS: pass 0, at document #3672000/4922894\n", + "2019-01-31 01:19:20,835 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:21,102 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.030*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:19:21,103 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.042*\"line\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:19:21,104 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.049*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"player\" + 0.016*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:19:21,105 : INFO : topic #19 (0.020): 0.015*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"ancestor\" + 0.007*\"known\"\n", + "2019-01-31 01:19:21,107 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:19:21,113 : INFO : topic diff=0.003094, rho=0.023338\n", + "2019-01-31 01:19:21,268 : INFO : PROGRESS: pass 0, at document #3674000/4922894\n", + "2019-01-31 01:19:22,631 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:22,898 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:19:22,899 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 
0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:19:22,900 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.007*\"male\" + 0.006*\"feel\"\n", + "2019-01-31 01:19:22,900 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.024*\"toronto\" + 0.021*\"ontario\" + 0.017*\"hydrogen\" + 0.016*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:19:22,901 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.035*\"cotton\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:19:22,907 : INFO : topic diff=0.003519, rho=0.023332\n", + "2019-01-31 01:19:23,062 : INFO : PROGRESS: pass 0, at document #3676000/4922894\n", + "2019-01-31 01:19:24,422 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:24,689 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.009*\"veget\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"encyclopedia\"\n", + "2019-01-31 01:19:24,690 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:19:24,691 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.009*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.007*\"male\" + 0.006*\"feel\"\n", + "2019-01-31 01:19:24,692 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.012*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 
0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:19:24,693 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"collect\" + 0.011*\"storag\"\n", + "2019-01-31 01:19:24,699 : INFO : topic diff=0.003386, rho=0.023325\n", + "2019-01-31 01:19:24,856 : INFO : PROGRESS: pass 0, at document #3678000/4922894\n", + "2019-01-31 01:19:26,241 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:26,508 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:19:26,509 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"alic\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:19:26,509 : INFO : topic #46 (0.020): 0.019*\"norwai\" + 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.013*\"huntsvil\" + 0.012*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:19:26,511 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:19:26,512 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.011*\"crayfish\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:19:26,518 : INFO : topic diff=0.003378, rho=0.023319\n", + "2019-01-31 01:19:29,277 : INFO : -11.762 per-word bound, 3473.4 perplexity 
estimate based on a held-out corpus of 2000 documents with 577792 words\n", + "2019-01-31 01:19:29,277 : INFO : PROGRESS: pass 0, at document #3680000/4922894\n", + "2019-01-31 01:19:30,648 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:30,915 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.008*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:19:30,916 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.011*\"http\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:19:30,917 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.011*\"crayfish\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:19:30,918 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:19:30,919 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.024*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 01:19:30,925 : INFO : topic diff=0.003556, rho=0.023313\n", + "2019-01-31 01:19:31,082 : INFO : PROGRESS: pass 0, at document #3682000/4922894\n", + "2019-01-31 01:19:32,434 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:32,700 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 
0.007*\"oper\"\n", + "2019-01-31 01:19:32,701 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.049*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"player\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:19:32,703 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:19:32,704 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.032*\"raid\" + 0.026*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:19:32,705 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:19:32,711 : INFO : topic diff=0.003685, rho=0.023306\n", + "2019-01-31 01:19:32,863 : INFO : PROGRESS: pass 0, at document #3684000/4922894\n", + "2019-01-31 01:19:34,216 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:34,484 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.019*\"mexico\" + 0.019*\"del\" + 0.017*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"mexican\" + 0.011*\"carlo\"\n", + "2019-01-31 01:19:34,485 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.032*\"germani\" + 0.017*\"vol\" + 0.014*\"der\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.010*\"european\" + 0.009*\"europ\" + 0.008*\"hungarian\"\n", + "2019-01-31 01:19:34,486 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.025*\"hoar\" + 0.024*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.016*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 
0.013*\"quebec\"\n", + "2019-01-31 01:19:34,486 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"maria\" + 0.012*\"count\"\n", + "2019-01-31 01:19:34,488 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.007*\"uruguayan\" + 0.007*\"championship\"\n", + "2019-01-31 01:19:34,493 : INFO : topic diff=0.003395, rho=0.023300\n", + "2019-01-31 01:19:34,650 : INFO : PROGRESS: pass 0, at document #3686000/4922894\n", + "2019-01-31 01:19:36,020 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:36,287 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:19:36,288 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:19:36,289 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.031*\"incumb\" + 0.012*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.011*\"televis\" + 0.011*\"sri\" + 0.010*\"affection\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:19:36,290 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"crayfish\" + 0.010*\"north\" + 0.010*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:19:36,291 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 
0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:19:36,297 : INFO : topic diff=0.003139, rho=0.023294\n", + "2019-01-31 01:19:36,454 : INFO : PROGRESS: pass 0, at document #3688000/4922894\n", + "2019-01-31 01:19:37,846 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:38,112 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.028*\"jpg\" + 0.026*\"fifteenth\" + 0.026*\"museo\" + 0.019*\"pain\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.013*\"gai\" + 0.011*\"artist\"\n", + "2019-01-31 01:19:38,113 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"mexico\" + 0.018*\"del\" + 0.017*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.011*\"mexican\"\n", + "2019-01-31 01:19:38,115 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.032*\"germani\" + 0.017*\"vol\" + 0.014*\"der\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"hungarian\" + 0.009*\"europ\"\n", + "2019-01-31 01:19:38,116 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"user\" + 0.007*\"championship\"\n", + "2019-01-31 01:19:38,117 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:19:38,123 : INFO : topic diff=0.002987, rho=0.023287\n", + "2019-01-31 01:19:38,274 : INFO : PROGRESS: pass 0, at document #3690000/4922894\n", + "2019-01-31 01:19:39,604 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:39,870 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 
0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"start\"\n", + "2019-01-31 01:19:39,871 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:19:39,872 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.019*\"event\" + 0.019*\"atheist\" + 0.018*\"alic\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:19:39,873 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"crayfish\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:19:39,874 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.013*\"kim\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:19:39,880 : INFO : topic diff=0.003826, rho=0.023281\n", + "2019-01-31 01:19:40,038 : INFO : PROGRESS: pass 0, at document #3692000/4922894\n", + "2019-01-31 01:19:41,429 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:41,696 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"crayfish\" + 0.010*\"north\" + 0.010*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:19:41,697 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:19:41,698 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 
0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:19:41,699 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:19:41,700 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"vigour\" + 0.044*\"popolo\" + 0.037*\"tortur\" + 0.034*\"cotton\" + 0.023*\"area\" + 0.021*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:19:41,706 : INFO : topic diff=0.003551, rho=0.023275\n", + "2019-01-31 01:19:41,863 : INFO : PROGRESS: pass 0, at document #3694000/4922894\n", + "2019-01-31 01:19:43,230 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:43,496 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.041*\"line\" + 0.032*\"raid\" + 0.026*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.018*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:19:43,497 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:19:43,498 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"function\"\n", + "2019-01-31 01:19:43,499 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"muskoge\" + 0.011*\"sri\" + 0.011*\"televis\" + 0.010*\"affection\" + 0.009*\"alam\"\n", + "2019-01-31 01:19:43,500 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 
0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:19:43,506 : INFO : topic diff=0.003725, rho=0.023268\n", + "2019-01-31 01:19:43,662 : INFO : PROGRESS: pass 0, at document #3696000/4922894\n", + "2019-01-31 01:19:45,019 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:45,285 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:19:45,286 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.019*\"tourist\" + 0.019*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:19:45,287 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"pop\" + 0.010*\"prognosi\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:19:45,288 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:19:45,290 : INFO : topic #31 (0.020): 0.054*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:19:45,295 : INFO : topic diff=0.004642, rho=0.023262\n", + "2019-01-31 01:19:45,453 : INFO : PROGRESS: pass 0, at document #3698000/4922894\n", + "2019-01-31 01:19:46,831 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:47,098 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.047*\"american\" + 
0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"english\" + 0.017*\"polit\" + 0.017*\"player\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:19:47,099 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:19:47,100 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"anim\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:19:47,101 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.021*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:19:47,102 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.023*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"malaysia\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:19:47,108 : INFO : topic diff=0.003341, rho=0.023256\n", + "2019-01-31 01:19:49,751 : INFO : -11.540 per-word bound, 2978.6 perplexity estimate based on a held-out corpus of 2000 documents with 542678 words\n", + "2019-01-31 01:19:49,751 : INFO : PROGRESS: pass 0, at document #3700000/4922894\n", + "2019-01-31 01:19:51,114 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:51,381 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:19:51,382 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.028*\"jpg\" + 0.026*\"museo\" + 0.026*\"fifteenth\" + 0.022*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 
0.014*\"exhaust\" + 0.013*\"gai\" + 0.011*\"artist\"\n", + "2019-01-31 01:19:51,383 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"treat\" + 0.006*\"acid\"\n", + "2019-01-31 01:19:51,384 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.013*\"women\"\n", + "2019-01-31 01:19:51,385 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.019*\"idiosyncrat\" + 0.016*\"grammat\" + 0.013*\"kingdom\" + 0.012*\"maria\" + 0.012*\"brazil\"\n", + "2019-01-31 01:19:51,392 : INFO : topic diff=0.002826, rho=0.023250\n", + "2019-01-31 01:19:51,551 : INFO : PROGRESS: pass 0, at document #3702000/4922894\n", + "2019-01-31 01:19:52,927 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:53,193 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:19:53,194 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.031*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"nation\"\n", + "2019-01-31 01:19:53,195 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.026*\"museo\" + 0.022*\"pain\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.013*\"gai\" + 0.011*\"depress\"\n", + "2019-01-31 01:19:53,196 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 
0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:19:53,197 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:19:53,204 : INFO : topic diff=0.003294, rho=0.023243\n", + "2019-01-31 01:19:53,364 : INFO : PROGRESS: pass 0, at document #3704000/4922894\n", + "2019-01-31 01:19:54,764 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:55,031 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:19:55,032 : INFO : topic #19 (0.020): 0.015*\"centuri\" + 0.015*\"languag\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"ancestor\" + 0.007*\"known\"\n", + "2019-01-31 01:19:55,033 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.016*\"grammat\" + 0.015*\"kingdom\" + 0.012*\"count\" + 0.012*\"brazil\"\n", + "2019-01-31 01:19:55,034 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"differ\"\n", + "2019-01-31 01:19:55,035 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.011*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:19:55,041 : INFO : topic diff=0.003567, rho=0.023237\n", + "2019-01-31 01:19:55,198 : INFO : PROGRESS: pass 
0, at document #3706000/4922894\n", + "2019-01-31 01:19:56,779 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:57,046 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:19:57,047 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"serv\"\n", + "2019-01-31 01:19:57,048 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"idiosyncrat\" + 0.016*\"grammat\" + 0.015*\"kingdom\" + 0.013*\"count\" + 0.012*\"brazil\"\n", + "2019-01-31 01:19:57,049 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.022*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"cathedr\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"poll\"\n", + "2019-01-31 01:19:57,050 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:19:57,056 : INFO : topic diff=0.003578, rho=0.023231\n", + "2019-01-31 01:19:57,211 : INFO : PROGRESS: pass 0, at document #3708000/4922894\n", + "2019-01-31 01:19:58,560 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:19:58,827 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"championship\"\n", + "2019-01-31 01:19:58,828 : INFO : topic #29 (0.020): 
0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.010*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"manag\" + 0.008*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:19:58,829 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:19:58,830 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.026*\"museo\" + 0.022*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.013*\"gai\" + 0.011*\"artist\"\n", + "2019-01-31 01:19:58,831 : INFO : topic #48 (0.020): 0.084*\"sens\" + 0.080*\"octob\" + 0.077*\"march\" + 0.072*\"juli\" + 0.070*\"august\" + 0.070*\"januari\" + 0.069*\"judici\" + 0.069*\"notion\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:19:58,837 : INFO : topic diff=0.003446, rho=0.023224\n", + "2019-01-31 01:19:59,055 : INFO : PROGRESS: pass 0, at document #3710000/4922894\n", + "2019-01-31 01:20:00,436 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:00,703 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"anim\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:20:00,704 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.024*\"poison\" + 0.024*\"reprint\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.014*\"unfortun\" + 0.014*\"malaysia\"\n", + "2019-01-31 01:20:00,705 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 0.014*\"leah\" + 0.014*\"kim\"\n", + "2019-01-31 01:20:00,706 : INFO : topic #23 (0.020): 0.134*\"audit\" 
+ 0.067*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.018*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:20:00,707 : INFO : topic #42 (0.020): 0.050*\"german\" + 0.032*\"germani\" + 0.017*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:20:00,713 : INFO : topic diff=0.003352, rho=0.023218\n", + "2019-01-31 01:20:00,876 : INFO : PROGRESS: pass 0, at document #3712000/4922894\n", + "2019-01-31 01:20:02,287 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:02,553 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:20:02,554 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:20:02,556 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:20:02,557 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.040*\"line\" + 0.031*\"raid\" + 0.027*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.018*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:20:02,558 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:20:02,563 : INFO : topic diff=0.003899, rho=0.023212\n", + "2019-01-31 
01:20:02,720 : INFO : PROGRESS: pass 0, at document #3714000/4922894\n", + "2019-01-31 01:20:04,091 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:04,358 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"centuri\"\n", + "2019-01-31 01:20:04,359 : INFO : topic #46 (0.020): 0.017*\"norwai\" + 0.017*\"sweden\" + 0.017*\"stop\" + 0.016*\"swedish\" + 0.015*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.011*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:20:04,360 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.026*\"museo\" + 0.021*\"pain\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.013*\"gai\" + 0.011*\"western\"\n", + "2019-01-31 01:20:04,361 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.024*\"poison\" + 0.024*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"malaysia\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:20:04,362 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.021*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:20:04,368 : INFO : topic diff=0.003435, rho=0.023206\n", + "2019-01-31 01:20:04,527 : INFO : PROGRESS: pass 0, at document #3716000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:20:05,911 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:06,178 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"militari\" + 
0.006*\"till\"\n", + "2019-01-31 01:20:06,179 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.012*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"collect\" + 0.011*\"storag\"\n", + "2019-01-31 01:20:06,180 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:20:06,181 : INFO : topic #16 (0.020): 0.063*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.012*\"maria\"\n", + "2019-01-31 01:20:06,182 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:20:06,188 : INFO : topic diff=0.003722, rho=0.023199\n", + "2019-01-31 01:20:06,345 : INFO : PROGRESS: pass 0, at document #3718000/4922894\n", + "2019-01-31 01:20:07,734 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:08,000 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:20:08,001 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"hormon\" + 0.009*\"media\" + 0.008*\"pathwai\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:20:08,002 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 
01:20:08,003 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"fool\" + 0.012*\"find\" + 0.012*\"ret\" + 0.012*\"tornado\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:20:08,004 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.024*\"poison\" + 0.023*\"reprint\" + 0.023*\"personifi\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.014*\"malaysia\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:20:08,010 : INFO : topic diff=0.003373, rho=0.023193\n", + "2019-01-31 01:20:10,740 : INFO : -11.623 per-word bound, 3155.0 perplexity estimate based on a held-out corpus of 2000 documents with 572427 words\n", + "2019-01-31 01:20:10,741 : INFO : PROGRESS: pass 0, at document #3720000/4922894\n", + "2019-01-31 01:20:12,128 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:12,395 : INFO : topic #16 (0.020): 0.063*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"quarterli\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.012*\"brazil\"\n", + "2019-01-31 01:20:12,396 : INFO : topic #39 (0.020): 0.062*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.025*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:20:12,397 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:20:12,398 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"briarwood\" + 0.010*\"centuri\"\n", + "2019-01-31 01:20:12,399 : INFO : topic #23 (0.020): 
0.135*\"audit\" + 0.068*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:20:12,405 : INFO : topic diff=0.004355, rho=0.023187\n", + "2019-01-31 01:20:12,565 : INFO : PROGRESS: pass 0, at document #3722000/4922894\n", + "2019-01-31 01:20:13,958 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:14,224 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"jame\" + 0.012*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:20:14,225 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\"\n", + "2019-01-31 01:20:14,226 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.024*\"sail\" + 0.022*\"jean\" + 0.019*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.008*\"sangha\"\n", + "2019-01-31 01:20:14,227 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"male\" + 0.007*\"incom\" + 0.007*\"feel\"\n", + "2019-01-31 01:20:14,228 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.016*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:20:14,234 : INFO : topic diff=0.003129, rho=0.023181\n", + "2019-01-31 01:20:14,390 : INFO : PROGRESS: pass 0, at document #3724000/4922894\n", + "2019-01-31 01:20:15,754 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:16,021 : INFO : topic #7 
(0.020): 0.021*\"snatch\" + 0.021*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.015*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"will\"\n", + "2019-01-31 01:20:16,022 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.023*\"nation\" + 0.022*\"minist\" + 0.022*\"govern\" + 0.022*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:20:16,023 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:20:16,024 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:20:16,025 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"crayfish\" + 0.009*\"sourc\" + 0.009*\"land\"\n", + "2019-01-31 01:20:16,031 : INFO : topic diff=0.003485, rho=0.023174\n", + "2019-01-31 01:20:16,182 : INFO : PROGRESS: pass 0, at document #3726000/4922894\n", + "2019-01-31 01:20:17,508 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:17,775 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:20:17,776 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:20:17,777 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 
0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"veget\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:20:17,778 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:20:17,779 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"anim\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:20:17,785 : INFO : topic diff=0.003791, rho=0.023168\n", + "2019-01-31 01:20:17,940 : INFO : PROGRESS: pass 0, at document #3728000/4922894\n", + "2019-01-31 01:20:19,331 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:20:19,597 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.025*\"australia\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:20:19,598 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"find\" + 0.012*\"fool\" + 0.011*\"tornado\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:20:19,599 : INFO : topic #42 (0.020): 0.050*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.014*\"der\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:20:19,600 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"collect\" + 0.011*\"storag\"\n", + 
"2019-01-31 01:20:19,601 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:20:19,607 : INFO : topic diff=0.003686, rho=0.023162\n", + "2019-01-31 01:20:19,763 : INFO : PROGRESS: pass 0, at document #3730000/4922894\n", + "2019-01-31 01:20:21,141 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:21,408 : INFO : topic #48 (0.020): 0.085*\"sens\" + 0.080*\"octob\" + 0.077*\"march\" + 0.072*\"juli\" + 0.070*\"august\" + 0.070*\"judici\" + 0.069*\"notion\" + 0.069*\"januari\" + 0.067*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:20:21,409 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:20:21,410 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"crete\" + 0.024*\"scientist\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:20:21,411 : INFO : topic #42 (0.020): 0.050*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.014*\"der\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:20:21,412 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"norwai\" + 0.017*\"stop\" + 0.016*\"swedish\" + 0.016*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.011*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:20:21,418 : INFO : topic diff=0.004074, rho=0.023156\n", + "2019-01-31 01:20:21,575 : INFO : PROGRESS: pass 0, at document #3732000/4922894\n", + "2019-01-31 01:20:22,968 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 01:20:23,234 : INFO : topic #0 (0.020): 0.067*\"statewid\" + 0.041*\"line\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"traceabl\" + 0.018*\"serv\" + 0.018*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:20:23,235 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:20:23,236 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"australia\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:20:23,237 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"bypass\" + 0.014*\"seaport\" + 0.013*\"liber\" + 0.013*\"republ\"\n", + "2019-01-31 01:20:23,238 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:20:23,244 : INFO : topic diff=0.004057, rho=0.023150\n", + "2019-01-31 01:20:23,402 : INFO : PROGRESS: pass 0, at document #3734000/4922894\n", + "2019-01-31 01:20:24,779 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:25,046 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.027*\"offic\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.022*\"minist\" + 0.022*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.015*\"chickasaw\"\n", + "2019-01-31 01:20:25,047 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", 
+ "2019-01-31 01:20:25,048 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:20:25,049 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.011*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:20:25,050 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.031*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:20:25,056 : INFO : topic diff=0.004014, rho=0.023143\n", + "2019-01-31 01:20:25,215 : INFO : PROGRESS: pass 0, at document #3736000/4922894\n", + "2019-01-31 01:20:26,616 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:26,882 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"find\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.012*\"fool\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:20:26,883 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"bypass\" + 0.014*\"seaport\" + 0.013*\"liber\" + 0.013*\"republ\"\n", + "2019-01-31 01:20:26,884 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:20:26,885 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.033*\"rural\" + 0.024*\"poison\" + 0.023*\"personifi\" + 0.022*\"reprint\" + 0.021*\"moscow\" + 0.017*\"poland\" + 0.014*\"tyrant\" + 
0.014*\"malaysia\"\n", + "2019-01-31 01:20:26,886 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\"\n", + "2019-01-31 01:20:26,892 : INFO : topic diff=0.003277, rho=0.023137\n", + "2019-01-31 01:20:27,051 : INFO : PROGRESS: pass 0, at document #3738000/4922894\n", + "2019-01-31 01:20:28,436 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:28,702 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.036*\"tortur\" + 0.036*\"cotton\" + 0.023*\"area\" + 0.021*\"adulthood\" + 0.021*\"multitud\" + 0.019*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:20:28,703 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"london\" + 0.024*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 01:20:28,704 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.021*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"bypass\" + 0.014*\"seaport\" + 0.013*\"liber\" + 0.013*\"republ\"\n", + "2019-01-31 01:20:28,705 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.011*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:20:28,706 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"georg\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:20:28,712 : INFO : topic diff=0.003337, rho=0.023131\n", + "2019-01-31 01:20:31,430 : INFO : -11.380 per-word bound, 2664.7 perplexity estimate based on a held-out corpus of 2000 documents 
with 570046 words\n", + "2019-01-31 01:20:31,430 : INFO : PROGRESS: pass 0, at document #3740000/4922894\n", + "2019-01-31 01:20:32,807 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:20:33,073 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.024*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.013*\"gai\" + 0.012*\"western\"\n", + "2019-01-31 01:20:33,074 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.025*\"toronto\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 01:20:33,075 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:20:33,076 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.011*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:20:33,077 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:20:33,083 : INFO : topic diff=0.003416, rho=0.023125\n", + "2019-01-31 01:20:33,297 : INFO : PROGRESS: pass 0, at document #3742000/4922894\n", + "2019-01-31 01:20:34,680 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:34,946 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.048*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"sourc\" + 0.015*\"shirin\" + 
0.014*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:20:34,947 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 01:20:34,948 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.025*\"toronto\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 01:20:34,949 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:20:34,950 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:20:34,956 : INFO : topic diff=0.002805, rho=0.023119\n", + "2019-01-31 01:20:35,109 : INFO : PROGRESS: pass 0, at document #3744000/4922894\n", + "2019-01-31 01:20:36,467 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:36,734 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:20:36,735 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"anim\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.006*\"storag\" + 0.006*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:20:36,736 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"stop\" + 0.017*\"norwai\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.013*\"norwegian\" + 0.013*\"wind\" + 0.011*\"huntsvil\" + 0.011*\"denmark\" 
+ 0.011*\"treeless\"\n", + "2019-01-31 01:20:36,737 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.008*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"acid\"\n", + "2019-01-31 01:20:36,738 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.027*\"offic\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.022*\"minist\" + 0.022*\"serv\" + 0.020*\"member\" + 0.016*\"gener\" + 0.016*\"start\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:20:36,743 : INFO : topic diff=0.003328, rho=0.023113\n", + "2019-01-31 01:20:36,901 : INFO : PROGRESS: pass 0, at document #3746000/4922894\n", + "2019-01-31 01:20:38,270 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:38,537 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.005*\"differ\"\n", + "2019-01-31 01:20:38,538 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:20:38,539 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:20:38,540 : INFO : topic #0 (0.020): 0.066*\"statewid\" + 0.042*\"line\" + 0.031*\"raid\" + 0.025*\"rosenwald\" + 0.024*\"rivièr\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.017*\"airmen\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:20:38,541 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 
01:20:38,547 : INFO : topic diff=0.002950, rho=0.023106\n", + "2019-01-31 01:20:38,705 : INFO : PROGRESS: pass 0, at document #3748000/4922894\n", + "2019-01-31 01:20:40,069 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:40,336 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:20:40,337 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.047*\"american\" + 0.028*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:20:40,338 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"crayfish\" + 0.009*\"land\"\n", + "2019-01-31 01:20:40,339 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.031*\"priest\" + 0.021*\"duke\" + 0.018*\"quarterli\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.013*\"brazil\"\n", + "2019-01-31 01:20:40,340 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:20:40,346 : INFO : topic diff=0.003069, rho=0.023100\n", + "2019-01-31 01:20:40,502 : INFO : PROGRESS: pass 0, at document #3750000/4922894\n", + "2019-01-31 01:20:41,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:42,143 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.023*\"sail\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 
01:20:42,144 : INFO : topic #2 (0.020): 0.051*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:20:42,145 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.033*\"yawn\" + 0.031*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.012*\"winner\"\n", + "2019-01-31 01:20:42,146 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"ancestor\" + 0.007*\"known\"\n", + "2019-01-31 01:20:42,147 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"anim\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.006*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:20:42,153 : INFO : topic diff=0.003296, rho=0.023094\n", + "2019-01-31 01:20:42,307 : INFO : PROGRESS: pass 0, at document #3752000/4922894\n", + "2019-01-31 01:20:43,665 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:43,931 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.012*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:20:43,932 : INFO : topic #34 (0.020): 0.064*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.027*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:20:43,933 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"der\" + 0.013*\"berlin\" + 
0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:20:43,934 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:20:43,935 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"anim\" + 0.011*\"septemb\" + 0.009*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"storag\" + 0.006*\"vision\"\n", + "2019-01-31 01:20:43,941 : INFO : topic diff=0.003514, rho=0.023088\n", + "2019-01-31 01:20:44,101 : INFO : PROGRESS: pass 0, at document #3754000/4922894\n", + "2019-01-31 01:20:45,500 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:45,767 : INFO : topic #5 (0.020): 0.037*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:20:45,768 : INFO : topic #40 (0.020): 0.083*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.020*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 01:20:45,770 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"cathedr\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:20:45,771 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:20:45,771 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 
0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:20:45,777 : INFO : topic diff=0.003947, rho=0.023082\n", + "2019-01-31 01:20:45,932 : INFO : PROGRESS: pass 0, at document #3756000/4922894\n", + "2019-01-31 01:20:47,290 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:47,557 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.078*\"octob\" + 0.076*\"march\" + 0.071*\"juli\" + 0.069*\"judici\" + 0.069*\"august\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.067*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:20:47,558 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.024*\"toronto\" + 0.021*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 01:20:47,559 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.009*\"cathedr\" + 0.009*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:20:47,560 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:20:47,561 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"chamber\" + 0.013*\"open\"\n", + "2019-01-31 01:20:47,567 : INFO : topic diff=0.003580, rho=0.023076\n", + "2019-01-31 01:20:47,725 : INFO : PROGRESS: pass 0, at document #3758000/4922894\n", + "2019-01-31 01:20:49,100 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:49,367 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 
0.018*\"place\" + 0.018*\"damn\" + 0.017*\"compos\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 01:20:49,368 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:20:49,369 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.009*\"elabor\" + 0.009*\"veget\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:20:49,370 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.021*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:20:49,371 : INFO : topic #45 (0.020): 0.036*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.018*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.014*\"gai\" + 0.012*\"artist\"\n", + "2019-01-31 01:20:49,377 : INFO : topic diff=0.003449, rho=0.023069\n", + "2019-01-31 01:20:52,024 : INFO : -11.705 per-word bound, 3339.3 perplexity estimate based on a held-out corpus of 2000 documents with 530422 words\n", + "2019-01-31 01:20:52,025 : INFO : PROGRESS: pass 0, at document #3760000/4922894\n", + "2019-01-31 01:20:53,378 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:53,644 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.037*\"tortur\" + 0.035*\"cotton\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"multitud\" + 0.019*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:20:53,645 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.028*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.013*\"muskoge\" + 0.012*\"anglo\" + 0.011*\"sri\" + 0.011*\"tajikistan\" + 
0.010*\"televis\" + 0.010*\"affection\"\n", + "2019-01-31 01:20:53,646 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:20:53,647 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"feel\" + 0.006*\"florida\"\n", + "2019-01-31 01:20:53,648 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n", + "2019-01-31 01:20:53,654 : INFO : topic diff=0.004169, rho=0.023063\n", + "2019-01-31 01:20:53,814 : INFO : PROGRESS: pass 0, at document #3762000/4922894\n", + "2019-01-31 01:20:55,202 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:55,469 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.046*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"player\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:20:55,470 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:20:55,471 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"ancestor\" + 0.007*\"known\"\n", + "2019-01-31 01:20:55,472 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 
0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:20:55,473 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:20:55,478 : INFO : topic diff=0.003462, rho=0.023057\n", + "2019-01-31 01:20:55,631 : INFO : PROGRESS: pass 0, at document #3764000/4922894\n", + "2019-01-31 01:20:56,974 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:57,240 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.039*\"struggl\" + 0.034*\"high\" + 0.032*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"gothic\" + 0.010*\"district\" + 0.010*\"task\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:20:57,241 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:20:57,242 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.036*\"tortur\" + 0.036*\"cotton\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"multitud\" + 0.019*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:20:57,243 : INFO : topic #46 (0.020): 0.018*\"damag\" + 0.017*\"norwai\" + 0.016*\"stop\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.011*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:20:57,245 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:20:57,250 : INFO : topic diff=0.003189, rho=0.023051\n", + "2019-01-31 01:20:57,405 : INFO : 
PROGRESS: pass 0, at document #3766000/4922894\n", + "2019-01-31 01:20:58,761 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:20:59,027 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:20:59,028 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"trap\" + 0.006*\"florida\"\n", + "2019-01-31 01:20:59,029 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"collect\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 01:20:59,030 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.005*\"method\"\n", + "2019-01-31 01:20:59,032 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.011*\"briarwood\" + 0.010*\"centuri\"\n", + "2019-01-31 01:20:59,037 : INFO : topic diff=0.003222, rho=0.023045\n", + "2019-01-31 01:20:59,192 : INFO : PROGRESS: pass 0, at document #3768000/4922894\n", + "2019-01-31 01:21:00,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:00,808 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:21:00,809 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 
0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:21:00,810 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"briarwood\" + 0.010*\"centuri\"\n", + "2019-01-31 01:21:00,811 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.015*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 01:21:00,812 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"trap\" + 0.006*\"florida\"\n", + "2019-01-31 01:21:00,818 : INFO : topic diff=0.004050, rho=0.023039\n", + "2019-01-31 01:21:00,981 : INFO : PROGRESS: pass 0, at document #3770000/4922894\n", + "2019-01-31 01:21:02,381 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:02,647 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:21:02,648 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.009*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:21:02,649 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:21:02,650 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 
0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"bypass\" + 0.015*\"republ\" + 0.014*\"seaport\" + 0.013*\"selma\"\n", + "2019-01-31 01:21:02,652 : INFO : topic #41 (0.020): 0.038*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:21:02,657 : INFO : topic diff=0.004060, rho=0.023033\n", + "2019-01-31 01:21:02,815 : INFO : PROGRESS: pass 0, at document #3772000/4922894\n", + "2019-01-31 01:21:04,189 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:04,457 : INFO : topic #27 (0.020): 0.070*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"ret\" + 0.012*\"find\" + 0.012*\"fool\" + 0.010*\"champion\" + 0.010*\"landslid\"\n", + "2019-01-31 01:21:04,458 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"trap\"\n", + "2019-01-31 01:21:04,459 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:21:04,460 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.011*\"european\" + 0.009*\"hungarian\" + 0.009*\"austria\"\n", + "2019-01-31 01:21:04,461 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.010*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:21:04,467 : INFO : topic diff=0.004034, rho=0.023027\n", + "2019-01-31 01:21:04,682 : 
INFO : PROGRESS: pass 0, at document #3774000/4922894\n", + "2019-01-31 01:21:06,081 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:06,347 : INFO : topic #46 (0.020): 0.017*\"damag\" + 0.017*\"stop\" + 0.016*\"norwai\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:21:06,348 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"briarwood\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\"\n", + "2019-01-31 01:21:06,349 : INFO : topic #45 (0.020): 0.037*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.026*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.014*\"colder\" + 0.014*\"gai\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 01:21:06,350 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:21:06,351 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"cytokin\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\"\n", + "2019-01-31 01:21:06,357 : INFO : topic diff=0.003025, rho=0.023020\n", + "2019-01-31 01:21:06,513 : INFO : PROGRESS: pass 0, at document #3776000/4922894\n", + "2019-01-31 01:21:07,880 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:08,146 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.036*\"tortur\" + 0.035*\"cotton\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.020*\"multitud\" + 0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:21:08,147 : INFO : topic #27 (0.020): 
0.070*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"ret\" + 0.012*\"find\" + 0.012*\"fool\" + 0.010*\"champion\" + 0.010*\"landslid\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:21:08,148 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:21:08,150 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:21:08,151 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:21:08,157 : INFO : topic diff=0.003120, rho=0.023014\n", + "2019-01-31 01:21:08,310 : INFO : PROGRESS: pass 0, at document #3778000/4922894\n", + "2019-01-31 01:21:09,682 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:09,949 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.028*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"collect\" + 0.011*\"author\"\n", + "2019-01-31 01:21:09,950 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.011*\"briarwood\" + 0.010*\"centuri\"\n", + "2019-01-31 01:21:09,951 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"polaris\" + 0.009*\"replac\" + 0.009*\"legal\" + 0.007*\"order\"\n", 
+ "2019-01-31 01:21:09,952 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:21:09,953 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:21:09,959 : INFO : topic diff=0.003370, rho=0.023008\n", + "2019-01-31 01:21:12,578 : INFO : -11.961 per-word bound, 3988.1 perplexity estimate based on a held-out corpus of 2000 documents with 522787 words\n", + "2019-01-31 01:21:12,579 : INFO : PROGRESS: pass 0, at document #3780000/4922894\n", + "2019-01-31 01:21:13,921 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:14,187 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"crete\" + 0.024*\"scientist\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:21:14,188 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.013*\"physician\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"jack\"\n", + "2019-01-31 01:21:14,189 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"servitud\" + 0.005*\"utopian\"\n", + "2019-01-31 01:21:14,190 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:21:14,191 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"damag\" + 
0.016*\"norwai\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:21:14,197 : INFO : topic diff=0.003498, rho=0.023002\n", + "2019-01-31 01:21:14,357 : INFO : PROGRESS: pass 0, at document #3782000/4922894\n", + "2019-01-31 01:21:15,736 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:16,003 : INFO : topic #43 (0.020): 0.062*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.013*\"seaport\" + 0.013*\"selma\"\n", + "2019-01-31 01:21:16,004 : INFO : topic #13 (0.020): 0.025*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.016*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:21:16,005 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"lobe\" + 0.009*\"land\"\n", + "2019-01-31 01:21:16,006 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\"\n", + "2019-01-31 01:21:16,007 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:21:16,013 : INFO : topic diff=0.003374, rho=0.022996\n", + "2019-01-31 01:21:16,167 : INFO : PROGRESS: pass 0, at document #3784000/4922894\n", + "2019-01-31 01:21:17,536 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:17,803 : INFO : topic #7 
(0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:21:17,804 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.024*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:21:17,805 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:21:17,806 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.047*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:21:17,807 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.013*\"der\" + 0.013*\"berlin\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:21:17,813 : INFO : topic diff=0.003121, rho=0.022990\n", + "2019-01-31 01:21:17,970 : INFO : PROGRESS: pass 0, at document #3786000/4922894\n", + "2019-01-31 01:21:19,350 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:19,617 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:21:19,617 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:21:19,619 : INFO : topic #23 (0.020): 
0.135*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:21:19,620 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:21:19,621 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.021*\"christian\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:21:19,626 : INFO : topic diff=0.003101, rho=0.022984\n", + "2019-01-31 01:21:19,784 : INFO : PROGRESS: pass 0, at document #3788000/4922894\n", + "2019-01-31 01:21:21,154 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:21,421 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.032*\"educ\" + 0.025*\"collector\" + 0.017*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:21:21,422 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.078*\"octob\" + 0.077*\"march\" + 0.072*\"juli\" + 0.071*\"august\" + 0.070*\"judici\" + 0.069*\"notion\" + 0.069*\"januari\" + 0.067*\"april\" + 0.064*\"decatur\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:21:21,423 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"lobe\" + 0.009*\"land\"\n", + "2019-01-31 01:21:21,424 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.023*\"area\" + 0.022*\"adulthood\" + 0.021*\"multitud\" + 
0.019*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:21:21,425 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:21:21,431 : INFO : topic diff=0.002981, rho=0.022978\n", + "2019-01-31 01:21:21,587 : INFO : PROGRESS: pass 0, at document #3790000/4922894\n", + "2019-01-31 01:21:22,961 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:23,228 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:21:23,229 : INFO : topic #41 (0.020): 0.038*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:21:23,230 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:21:23,231 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"open\" + 0.014*\"tiepolo\" + 0.013*\"chamber\"\n", + "2019-01-31 01:21:23,232 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:21:23,238 : INFO : topic diff=0.003257, rho=0.022972\n", + "2019-01-31 01:21:23,395 : INFO : PROGRESS: pass 0, at document #3792000/4922894\n", + "2019-01-31 01:21:24,764 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:21:25,030 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:21:25,031 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:21:25,032 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:21:25,034 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.012*\"find\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:21:25,035 : INFO : topic #41 (0.020): 0.038*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:21:25,040 : INFO : topic diff=0.002636, rho=0.022966\n", + "2019-01-31 01:21:25,197 : INFO : PROGRESS: pass 0, at document #3794000/4922894\n", + "2019-01-31 01:21:26,563 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:26,829 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.007*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:21:26,831 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 
0.016*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 01:21:26,832 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.005*\"utopian\"\n", + "2019-01-31 01:21:26,833 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:21:26,834 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.022*\"theater\" + 0.019*\"place\" + 0.018*\"compos\" + 0.017*\"damn\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.013*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 01:21:26,840 : INFO : topic diff=0.003099, rho=0.022960\n", + "2019-01-31 01:21:26,993 : INFO : PROGRESS: pass 0, at document #3796000/4922894\n", + "2019-01-31 01:21:28,351 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:28,618 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.031*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.025*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:21:28,619 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.022*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.011*\"find\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:21:28,620 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.046*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.015*\"kim\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:21:28,621 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.020*\"champion\" + 0.015*\"taxpay\" + 0.015*\"martin\" + 
0.014*\"winner\" + 0.014*\"tiepolo\" + 0.014*\"chamber\"\n", + "2019-01-31 01:21:28,622 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:21:28,628 : INFO : topic diff=0.003356, rho=0.022954\n", + "2019-01-31 01:21:28,788 : INFO : PROGRESS: pass 0, at document #3798000/4922894\n", + "2019-01-31 01:21:30,196 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:30,463 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:21:30,464 : INFO : topic #41 (0.020): 0.038*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:21:30,465 : INFO : topic #32 (0.020): 0.054*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.020*\"multitud\" + 0.020*\"cede\" + 0.019*\"regim\"\n", + "2019-01-31 01:21:30,466 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.047*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:21:30,467 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:21:30,473 : INFO : topic diff=0.004252, rho=0.022948\n", + "2019-01-31 01:21:33,146 : INFO : -11.837 per-word bound, 3657.8 perplexity estimate based on a held-out 
corpus of 2000 documents with 566504 words\n", + "2019-01-31 01:21:33,146 : INFO : PROGRESS: pass 0, at document #3800000/4922894\n", + "2019-01-31 01:21:34,505 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:34,772 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.031*\"raid\" + 0.025*\"rosenwald\" + 0.024*\"rivièr\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.018*\"airmen\" + 0.015*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:21:34,773 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.010*\"briarwood\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:21:34,774 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.029*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"sri\" + 0.010*\"khalsa\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:21:34,775 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:21:34,776 : INFO : topic #16 (0.020): 0.059*\"king\" + 0.030*\"priest\" + 0.022*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.016*\"grammat\" + 0.014*\"kingdom\" + 0.013*\"count\" + 0.013*\"brazil\"\n", + "2019-01-31 01:21:34,782 : INFO : topic diff=0.004160, rho=0.022942\n", + "2019-01-31 01:21:34,942 : INFO : PROGRESS: pass 0, at document #3802000/4922894\n", + "2019-01-31 01:21:36,327 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:36,593 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 
0.017*\"damn\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:21:36,594 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:21:36,595 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.015*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.008*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:21:36,597 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.027*\"offic\" + 0.023*\"minist\" + 0.023*\"nation\" + 0.023*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:21:36,598 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"bypass\" + 0.014*\"republ\" + 0.013*\"seaport\" + 0.013*\"liber\"\n", + "2019-01-31 01:21:36,603 : INFO : topic diff=0.003732, rho=0.022936\n", + "2019-01-31 01:21:36,760 : INFO : PROGRESS: pass 0, at document #3804000/4922894\n", + "2019-01-31 01:21:38,130 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:38,396 : INFO : topic #43 (0.020): 0.063*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"bypass\" + 0.014*\"republ\" + 0.013*\"seaport\" + 0.013*\"liber\"\n", + "2019-01-31 01:21:38,397 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.021*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:21:38,398 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.043*\"line\" + 0.031*\"raid\" + 0.025*\"rosenwald\" + 
0.025*\"rivièr\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.018*\"airmen\" + 0.015*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:21:38,399 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.008*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:21:38,400 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:21:38,406 : INFO : topic diff=0.003228, rho=0.022930\n", + "2019-01-31 01:21:38,617 : INFO : PROGRESS: pass 0, at document #3806000/4922894\n", + "2019-01-31 01:21:39,987 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:40,254 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"lobe\" + 0.009*\"land\"\n", + "2019-01-31 01:21:40,255 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:21:40,256 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.007*\"championship\"\n", + "2019-01-31 01:21:40,257 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:21:40,258 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.016*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 
0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:21:40,264 : INFO : topic diff=0.003052, rho=0.022923\n", + "2019-01-31 01:21:40,420 : INFO : PROGRESS: pass 0, at document #3808000/4922894\n", + "2019-01-31 01:21:41,797 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:42,063 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.078*\"march\" + 0.077*\"octob\" + 0.072*\"juli\" + 0.072*\"august\" + 0.070*\"judici\" + 0.069*\"notion\" + 0.068*\"januari\" + 0.067*\"april\" + 0.063*\"decatur\"\n", + "2019-01-31 01:21:42,064 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:21:42,065 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:21:42,066 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:21:42,067 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"jame\" + 0.011*\"david\" + 0.011*\"will\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:21:42,073 : INFO : topic diff=0.003396, rho=0.022917\n", + "2019-01-31 01:21:42,229 : INFO : PROGRESS: pass 0, at document #3810000/4922894\n", + "2019-01-31 01:21:43,593 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:43,859 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 
0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"trap\"\n", + "2019-01-31 01:21:43,861 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:21:43,862 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.009*\"veget\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:21:43,863 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:21:43,864 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.033*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"europ\" + 0.009*\"hungarian\"\n", + "2019-01-31 01:21:43,870 : INFO : topic diff=0.003541, rho=0.022911\n", + "2019-01-31 01:21:44,030 : INFO : PROGRESS: pass 0, at document #3812000/4922894\n", + "2019-01-31 01:21:45,430 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:45,697 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.028*\"incumb\" + 0.015*\"pakistan\" + 0.013*\"islam\" + 0.013*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 0.010*\"sri\" + 0.010*\"alam\"\n", + "2019-01-31 01:21:45,698 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:21:45,699 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.047*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 
0.015*\"new\" + 0.015*\"novotná\" + 0.013*\"misericordia\" + 0.012*\"quebec\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:21:45,700 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.009*\"start\"\n", + "2019-01-31 01:21:45,701 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:21:45,707 : INFO : topic diff=0.004560, rho=0.022905\n", + "2019-01-31 01:21:45,866 : INFO : PROGRESS: pass 0, at document #3814000/4922894\n", + "2019-01-31 01:21:47,240 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:47,506 : INFO : topic #41 (0.020): 0.039*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:21:47,507 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"lobe\" + 0.009*\"land\"\n", + "2019-01-31 01:21:47,508 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"trap\"\n", + "2019-01-31 01:21:47,509 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.020*\"champion\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"open\" + 0.013*\"chamber\"\n", + "2019-01-31 01:21:47,510 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.028*\"incumb\" + 0.015*\"pakistan\" + 
0.013*\"islam\" + 0.012*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 0.010*\"sri\" + 0.010*\"alam\"\n", + "2019-01-31 01:21:47,516 : INFO : topic diff=0.003820, rho=0.022899\n", + "2019-01-31 01:21:47,669 : INFO : PROGRESS: pass 0, at document #3816000/4922894\n", + "2019-01-31 01:21:49,029 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:49,295 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:21:49,296 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"norwai\" + 0.016*\"damag\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.012*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:21:49,297 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"turn\" + 0.006*\"develop\"\n", + "2019-01-31 01:21:49,298 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:21:49,299 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 01:21:49,305 : INFO : topic diff=0.003664, rho=0.022893\n", + "2019-01-31 01:21:49,460 : INFO : PROGRESS: pass 0, at document #3818000/4922894\n", + "2019-01-31 01:21:50,823 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:51,090 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 
0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:21:51,091 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.044*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.020*\"korea\" + 0.018*\"kim\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:21:51,092 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.022*\"adulthood\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:21:51,093 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.022*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.011*\"champion\" + 0.010*\"landslid\"\n", + "2019-01-31 01:21:51,094 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.012*\"quebec\"\n", + "2019-01-31 01:21:51,100 : INFO : topic diff=0.003717, rho=0.022887\n", + "2019-01-31 01:21:53,770 : INFO : -11.499 per-word bound, 2893.6 perplexity estimate based on a held-out corpus of 2000 documents with 558226 words\n", + "2019-01-31 01:21:53,770 : INFO : PROGRESS: pass 0, at document #3820000/4922894\n", + "2019-01-31 01:21:55,131 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:55,397 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:21:55,398 : INFO : topic #16 (0.020): 0.060*\"king\" + 0.030*\"priest\" + 0.021*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"quarterli\" + 0.018*\"idiosyncrat\" + 
0.016*\"grammat\" + 0.013*\"count\" + 0.013*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:21:55,399 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"treeless\" + 0.011*\"denmark\"\n", + "2019-01-31 01:21:55,400 : INFO : topic #45 (0.020): 0.038*\"arsen\" + 0.029*\"jpg\" + 0.026*\"fifteenth\" + 0.026*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.015*\"colder\" + 0.014*\"gai\" + 0.014*\"exhaust\" + 0.012*\"artist\"\n", + "2019-01-31 01:21:55,401 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.022*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.013*\"chickasaw\"\n", + "2019-01-31 01:21:55,407 : INFO : topic diff=0.002928, rho=0.022881\n", + "2019-01-31 01:21:55,561 : INFO : PROGRESS: pass 0, at document #3822000/4922894\n", + "2019-01-31 01:21:56,928 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:57,234 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:21:57,235 : INFO : topic #45 (0.020): 0.038*\"arsen\" + 0.029*\"jpg\" + 0.027*\"fifteenth\" + 0.026*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.014*\"gai\" + 0.012*\"artist\"\n", + "2019-01-31 01:21:57,236 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.012*\"huntsvil\" + 0.011*\"denmark\" + 0.011*\"treeless\"\n", + "2019-01-31 01:21:57,237 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 
0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"bahá\" + 0.009*\"fleet\"\n", + "2019-01-31 01:21:57,238 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 01:21:57,245 : INFO : topic diff=0.003490, rho=0.022875\n", + "2019-01-31 01:21:57,398 : INFO : PROGRESS: pass 0, at document #3824000/4922894\n", + "2019-01-31 01:21:58,759 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:21:59,026 : INFO : topic #34 (0.020): 0.064*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.027*\"unionist\" + 0.027*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"citi\"\n", + "2019-01-31 01:21:59,027 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"teufel\" + 0.006*\"citi\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:21:59,028 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:21:59,029 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"championship\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:21:59,030 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"briarwood\" + 0.011*\"centuri\"\n", + "2019-01-31 01:21:59,036 : INFO : topic diff=0.003194, rho=0.022869\n", + "2019-01-31 01:21:59,186 : 
INFO : PROGRESS: pass 0, at document #3826000/4922894\n", + "2019-01-31 01:22:00,510 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:00,777 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.022*\"candid\" + 0.018*\"taxpay\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"champion\" + 0.010*\"landslid\"\n", + "2019-01-31 01:22:00,778 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.079*\"march\" + 0.078*\"octob\" + 0.073*\"juli\" + 0.072*\"august\" + 0.071*\"januari\" + 0.070*\"notion\" + 0.070*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:22:00,779 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"sack\" + 0.007*\"later\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:22:00,780 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 01:22:00,781 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.021*\"multitud\" + 0.019*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:22:00,787 : INFO : topic diff=0.003850, rho=0.022863\n", + "2019-01-31 01:22:00,947 : INFO : PROGRESS: pass 0, at document #3828000/4922894\n", + "2019-01-31 01:22:02,332 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:02,599 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:22:02,600 : INFO : topic #1 (0.020): 0.056*\"china\" + 
0.044*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.018*\"kim\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.013*\"shirin\"\n", + "2019-01-31 01:22:02,601 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.044*\"line\" + 0.030*\"raid\" + 0.027*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.017*\"airmen\" + 0.015*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:22:02,602 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.013*\"wind\" + 0.013*\"treeless\" + 0.013*\"norwegian\" + 0.013*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:22:02,603 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.015*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.009*\"legal\" + 0.007*\"justic\"\n", + "2019-01-31 01:22:02,609 : INFO : topic diff=0.004031, rho=0.022858\n", + "2019-01-31 01:22:02,768 : INFO : PROGRESS: pass 0, at document #3830000/4922894\n", + "2019-01-31 01:22:04,131 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:04,398 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:22:04,399 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.046*\"american\" + 0.029*\"valour\" + 0.019*\"folei\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:22:04,401 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:22:04,402 : INFO : topic #32 (0.020): 0.053*\"district\" + 
0.044*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:22:04,403 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.015*\"pour\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.007*\"uruguayan\" + 0.006*\"produc\" + 0.006*\"turn\" + 0.006*\"develop\"\n", + "2019-01-31 01:22:04,409 : INFO : topic diff=0.003274, rho=0.022852\n", + "2019-01-31 01:22:04,563 : INFO : PROGRESS: pass 0, at document #3832000/4922894\n", + "2019-01-31 01:22:05,923 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:06,189 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:22:06,190 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.033*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.013*\"der\" + 0.011*\"european\" + 0.009*\"hungarian\" + 0.009*\"europ\"\n", + "2019-01-31 01:22:06,192 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"battalion\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"citi\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:22:06,192 : INFO : topic #16 (0.020): 0.062*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.018*\"quarterli\" + 0.016*\"grammat\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + "2019-01-31 01:22:06,193 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:22:06,199 : INFO : topic 
diff=0.003031, rho=0.022846\n", + "2019-01-31 01:22:06,354 : INFO : PROGRESS: pass 0, at document #3834000/4922894\n", + "2019-01-31 01:22:07,716 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:07,982 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.044*\"chilton\" + 0.026*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.018*\"kim\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:22:07,983 : INFO : topic #48 (0.020): 0.083*\"sens\" + 0.080*\"march\" + 0.078*\"octob\" + 0.073*\"juli\" + 0.072*\"august\" + 0.070*\"januari\" + 0.070*\"notion\" + 0.070*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:22:07,984 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:22:07,985 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.024*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.010*\"lizard\" + 0.010*\"juan\"\n", + "2019-01-31 01:22:07,986 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.024*\"schuster\" + 0.023*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.011*\"degre\" + 0.011*\"word\" + 0.011*\"http\"\n", + "2019-01-31 01:22:07,992 : INFO : topic diff=0.003450, rho=0.022840\n", + "2019-01-31 01:22:08,147 : INFO : PROGRESS: pass 0, at document #3836000/4922894\n", + "2019-01-31 01:22:09,509 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:09,775 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"battalion\" + 0.009*\"aza\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"teufel\" + 0.006*\"citi\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:22:09,776 : INFO : 
topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"male\"\n", + "2019-01-31 01:22:09,777 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:22:09,778 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.044*\"line\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.025*\"rivièr\" + 0.019*\"traceabl\" + 0.019*\"serv\" + 0.017*\"airmen\" + 0.015*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:22:09,779 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:22:09,785 : INFO : topic diff=0.003379, rho=0.022834\n", + "2019-01-31 01:22:09,940 : INFO : PROGRESS: pass 0, at document #3838000/4922894\n", + "2019-01-31 01:22:11,288 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:11,554 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"briarwood\" + 0.010*\"centuri\"\n", + "2019-01-31 01:22:11,555 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.028*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"islam\" + 0.012*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"khalsa\" + 0.010*\"alam\" + 0.010*\"sri\" + 0.010*\"affection\"\n", + "2019-01-31 01:22:11,556 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.079*\"march\" + 0.077*\"octob\" + 0.072*\"juli\" + 0.071*\"august\" + 0.070*\"januari\" + 0.069*\"notion\" + 
0.069*\"judici\" + 0.066*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:22:11,557 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"male\"\n", + "2019-01-31 01:22:11,559 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"sack\" + 0.007*\"later\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.005*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:22:11,564 : INFO : topic diff=0.003153, rho=0.022828\n", + "2019-01-31 01:22:14,291 : INFO : -11.945 per-word bound, 3943.6 perplexity estimate based on a held-out corpus of 2000 documents with 554865 words\n", + "2019-01-31 01:22:14,291 : INFO : PROGRESS: pass 0, at document #3840000/4922894\n", + "2019-01-31 01:22:15,660 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:15,926 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.024*\"schuster\" + 0.023*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.011*\"degre\" + 0.011*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:22:15,927 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.015*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:22:15,928 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.048*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.018*\"hydrogen\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.013*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:22:15,929 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:22:15,930 : INFO : topic #35 
(0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.015*\"tyrant\" + 0.014*\"turin\"\n", + "2019-01-31 01:22:15,936 : INFO : topic diff=0.003116, rho=0.022822\n", + "2019-01-31 01:22:16,091 : INFO : PROGRESS: pass 0, at document #3842000/4922894\n", + "2019-01-31 01:22:17,450 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:17,716 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.014*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:22:17,717 : INFO : topic #34 (0.020): 0.064*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.028*\"cotton\" + 0.027*\"unionist\" + 0.021*\"year\" + 0.015*\"california\" + 0.014*\"terri\" + 0.013*\"warrior\" + 0.012*\"citi\"\n", + "2019-01-31 01:22:17,718 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:22:17,719 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.036*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.023*\"reprint\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.015*\"tyrant\" + 0.014*\"turin\"\n", + "2019-01-31 01:22:17,720 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.024*\"schuster\" + 0.023*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.011*\"degre\" + 0.011*\"word\"\n", + "2019-01-31 01:22:17,726 : INFO : topic diff=0.003861, rho=0.022816\n", + "2019-01-31 01:22:17,876 : INFO : PROGRESS: pass 0, at document #3844000/4922894\n", + "2019-01-31 01:22:19,207 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", 
+ "2019-01-31 01:22:19,474 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.080*\"march\" + 0.078*\"octob\" + 0.072*\"juli\" + 0.072*\"august\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.069*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:22:19,475 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.010*\"centuri\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:22:19,476 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.029*\"priest\" + 0.020*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.018*\"rotterdam\" + 0.017*\"grammat\" + 0.013*\"kingdom\" + 0.013*\"count\" + 0.012*\"portugues\"\n", + "2019-01-31 01:22:19,477 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.044*\"chilton\" + 0.026*\"hong\" + 0.026*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.017*\"kim\" + 0.015*\"sourc\" + 0.015*\"leah\" + 0.014*\"shirin\"\n", + "2019-01-31 01:22:19,478 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.011*\"network\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:22:19,483 : INFO : topic diff=0.003386, rho=0.022810\n", + "2019-01-31 01:22:19,641 : INFO : PROGRESS: pass 0, at document #3846000/4922894\n", + "2019-01-31 01:22:21,002 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:21,268 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.045*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:22:21,269 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.047*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 
0.012*\"quebec\"\n", + "2019-01-31 01:22:21,271 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.030*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 01:22:21,272 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:22:21,273 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:22:21,279 : INFO : topic diff=0.004282, rho=0.022804\n", + "2019-01-31 01:22:21,436 : INFO : PROGRESS: pass 0, at document #3848000/4922894\n", + "2019-01-31 01:22:22,833 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:23,099 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:22:23,100 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:22:23,101 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\" + 0.013*\"chamber\"\n", + "2019-01-31 01:22:23,102 : INFO : topic #16 (0.020): 0.061*\"king\" + 0.029*\"priest\" + 0.021*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.017*\"rotterdam\" + 0.016*\"grammat\" + 0.013*\"kingdom\" + 0.013*\"count\" + 
0.012*\"portugues\"\n", + "2019-01-31 01:22:23,103 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.044*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.018*\"kim\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:22:23,109 : INFO : topic diff=0.003134, rho=0.022798\n", + "2019-01-31 01:22:23,267 : INFO : PROGRESS: pass 0, at document #3850000/4922894\n", + "2019-01-31 01:22:24,659 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:24,926 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.047*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.012*\"quebec\"\n", + "2019-01-31 01:22:24,927 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:22:24,928 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.044*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.020*\"korea\" + 0.019*\"korean\" + 0.018*\"kim\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:22:24,929 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:22:24,930 : INFO : topic #45 (0.020): 0.037*\"arsen\" + 0.030*\"jpg\" + 0.027*\"fifteenth\" + 0.026*\"museo\" + 0.021*\"illicit\" + 0.021*\"pain\" + 0.015*\"exhaust\" + 0.015*\"colder\" + 0.014*\"gai\" + 0.013*\"artist\"\n", + "2019-01-31 01:22:24,936 : INFO : topic diff=0.003043, rho=0.022792\n", + "2019-01-31 01:22:25,093 : INFO : PROGRESS: pass 0, at document #3852000/4922894\n", + "2019-01-31 01:22:26,452 : 
INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:26,719 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"palmer\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:22:26,720 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"polaris\" + 0.010*\"replac\" + 0.008*\"legal\" + 0.006*\"rudolf\"\n", + "2019-01-31 01:22:26,721 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"male\" + 0.006*\"florida\"\n", + "2019-01-31 01:22:26,722 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.045*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:22:26,723 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:22:26,729 : INFO : topic diff=0.003337, rho=0.022786\n", + "2019-01-31 01:22:26,882 : INFO : PROGRESS: pass 0, at document #3854000/4922894\n", + "2019-01-31 01:22:28,223 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:28,490 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:22:28,491 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" 
+ 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:22:28,492 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:22:28,493 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.025*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:22:28,494 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:22:28,500 : INFO : topic diff=0.003256, rho=0.022780\n", + "2019-01-31 01:22:28,659 : INFO : PROGRESS: pass 0, at document #3856000/4922894\n", + "2019-01-31 01:22:30,046 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:30,312 : INFO : topic #48 (0.020): 0.082*\"sens\" + 0.079*\"march\" + 0.078*\"octob\" + 0.073*\"juli\" + 0.072*\"august\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.069*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:22:30,313 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:22:30,314 : INFO : topic #34 (0.020): 0.063*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.028*\"cotton\" + 0.027*\"unionist\" + 0.021*\"year\" + 0.014*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"citi\"\n", + "2019-01-31 01:22:30,315 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.021*\"multitud\" + 
0.021*\"adulthood\" + 0.019*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:22:30,316 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:22:30,322 : INFO : topic diff=0.003599, rho=0.022774\n", + "2019-01-31 01:22:30,483 : INFO : PROGRESS: pass 0, at document #3858000/4922894\n", + "2019-01-31 01:22:31,868 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:32,135 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"offic\" + 0.026*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:22:32,136 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:22:32,137 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"sai\"\n", + "2019-01-31 01:22:32,138 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.067*\"best\" + 0.033*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:22:32,139 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.048*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:22:32,145 : INFO : topic diff=0.002901, rho=0.022768\n", + "2019-01-31 01:22:34,710 : INFO : -11.644 per-word bound, 3199.7 perplexity estimate based on a held-out corpus of 2000 documents with 509170 
words\n", + "2019-01-31 01:22:34,711 : INFO : PROGRESS: pass 0, at document #3860000/4922894\n", + "2019-01-31 01:22:36,036 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:36,302 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.024*\"schuster\" + 0.023*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.012*\"degre\"\n", + "2019-01-31 01:22:36,303 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:22:36,305 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"sack\" + 0.007*\"later\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:22:36,306 : INFO : topic #32 (0.020): 0.053*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.021*\"adulthood\" + 0.020*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:22:36,307 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:22:36,313 : INFO : topic diff=0.003388, rho=0.022763\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:22:36,468 : INFO : PROGRESS: pass 0, at document #3862000/4922894\n", + "2019-01-31 01:22:37,826 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:38,092 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 
0.006*\"brown\"\n", + "2019-01-31 01:22:38,093 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:22:38,094 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.022*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:22:38,095 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.007*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:22:38,096 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:22:38,102 : INFO : topic diff=0.003561, rho=0.022757\n", + "2019-01-31 01:22:38,257 : INFO : PROGRESS: pass 0, at document #3864000/4922894\n", + "2019-01-31 01:22:39,620 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:39,886 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:22:39,887 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.022*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.017*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:22:39,888 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.047*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 
0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:22:39,889 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"citi\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:22:39,891 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:22:39,896 : INFO : topic diff=0.003511, rho=0.022751\n", + "2019-01-31 01:22:40,054 : INFO : PROGRESS: pass 0, at document #3866000/4922894\n", + "2019-01-31 01:22:41,427 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:41,694 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:22:41,695 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.014*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:22:41,696 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"ancestor\"\n", + "2019-01-31 01:22:41,697 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:22:41,698 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" 
+ 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:22:41,704 : INFO : topic diff=0.002898, rho=0.022745\n", + "2019-01-31 01:22:41,863 : INFO : PROGRESS: pass 0, at document #3868000/4922894\n", + "2019-01-31 01:22:43,239 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:43,506 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.047*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:22:43,507 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:22:43,509 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:22:43,510 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:22:43,511 : INFO : topic #45 (0.020): 0.038*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.026*\"museo\" + 0.021*\"pain\" + 0.021*\"illicit\" + 0.015*\"exhaust\" + 0.014*\"gai\" + 0.014*\"colder\" + 0.013*\"artist\"\n", + "2019-01-31 01:22:43,517 : INFO : topic diff=0.003780, rho=0.022739\n", + "2019-01-31 01:22:43,729 : INFO : PROGRESS: pass 0, at document #3870000/4922894\n", + "2019-01-31 01:22:45,100 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:45,367 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.008*\"develop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 
0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:22:45,368 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.026*\"hong\" + 0.026*\"kong\" + 0.019*\"korea\" + 0.017*\"korean\" + 0.016*\"kim\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:22:45,368 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:22:45,369 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.033*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:22:45,370 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:22:45,376 : INFO : topic diff=0.003167, rho=0.022733\n", + "2019-01-31 01:22:45,537 : INFO : PROGRESS: pass 0, at document #3872000/4922894\n", + "2019-01-31 01:22:46,920 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:47,186 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.017*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:22:47,187 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:22:47,188 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.036*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" 
+ 0.015*\"turin\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:22:47,189 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.026*\"hong\" + 0.026*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.016*\"kim\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\"\n", + "2019-01-31 01:22:47,190 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.070*\"juli\" + 0.069*\"august\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.065*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:22:47,196 : INFO : topic diff=0.003341, rho=0.022727\n", + "2019-01-31 01:22:47,357 : INFO : PROGRESS: pass 0, at document #3874000/4922894\n", + "2019-01-31 01:22:48,750 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:22:49,016 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"norwai\" + 0.017*\"stop\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:22:49,017 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.036*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"turin\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:22:49,018 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.017*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:22:49,019 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"hormon\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:22:49,020 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.029*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 
0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:22:49,026 : INFO : topic diff=0.003746, rho=0.022721\n", + "2019-01-31 01:22:49,182 : INFO : PROGRESS: pass 0, at document #3876000/4922894\n", + "2019-01-31 01:22:50,554 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:50,820 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.021*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.006*\"rudolf\"\n", + "2019-01-31 01:22:50,821 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"blur\" + 0.012*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:22:50,822 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.047*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.018*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:22:50,823 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:22:50,824 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"teratogen\" + 0.006*\"produc\"\n", + "2019-01-31 01:22:50,830 : INFO : topic diff=0.003502, rho=0.022716\n", + "2019-01-31 01:22:50,988 : INFO : PROGRESS: pass 0, at document #3878000/4922894\n", + "2019-01-31 01:22:52,355 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:52,622 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 
0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:22:52,623 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"trap\"\n", + "2019-01-31 01:22:52,624 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"itali\"\n", + "2019-01-31 01:22:52,625 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.023*\"democrat\" + 0.023*\"voluntari\" + 0.021*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:22:52,626 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.022*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:22:52,632 : INFO : topic diff=0.003351, rho=0.022710\n", + "2019-01-31 01:22:55,342 : INFO : -11.877 per-word bound, 3762.1 perplexity estimate based on a held-out corpus of 2000 documents with 572994 words\n", + "2019-01-31 01:22:55,342 : INFO : PROGRESS: pass 0, at document #3880000/4922894\n", + "2019-01-31 01:22:56,727 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:56,993 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:22:56,995 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.029*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + 
"2019-01-31 01:22:56,996 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.029*\"incumb\" + 0.013*\"pakistan\" + 0.012*\"islam\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"televis\" + 0.011*\"sri\" + 0.011*\"khalsa\" + 0.010*\"affection\"\n", + "2019-01-31 01:22:56,997 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.020*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:22:56,998 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:22:57,004 : INFO : topic diff=0.003418, rho=0.022704\n", + "2019-01-31 01:22:57,161 : INFO : PROGRESS: pass 0, at document #3882000/4922894\n", + "2019-01-31 01:22:58,522 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:22:58,789 : INFO : topic #33 (0.020): 0.062*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:22:58,790 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:22:58,791 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"male\" + 0.006*\"florida\"\n", + "2019-01-31 01:22:58,792 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"norwai\" + 0.017*\"stop\" + 0.015*\"damag\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 
01:22:58,793 : INFO : topic #27 (0.020): 0.071*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.014*\"driver\" + 0.013*\"ret\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.011*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:22:58,799 : INFO : topic diff=0.002982, rho=0.022698\n", + "2019-01-31 01:22:58,953 : INFO : PROGRESS: pass 0, at document #3884000/4922894\n", + "2019-01-31 01:23:00,310 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:00,577 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"male\" + 0.006*\"florida\"\n", + "2019-01-31 01:23:00,578 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"offic\" + 0.025*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"serv\" + 0.020*\"member\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:23:00,579 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:23:00,580 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:23:00,581 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:23:00,587 : INFO : topic diff=0.003440, rho=0.022692\n", + "2019-01-31 01:23:00,743 : INFO : PROGRESS: pass 0, at document #3886000/4922894\n", + "2019-01-31 01:23:02,114 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 01:23:02,381 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.014*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:23:02,382 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:23:02,383 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:23:02,384 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:23:02,385 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.014*\"tyrant\" + 0.014*\"turin\"\n", + "2019-01-31 01:23:02,391 : INFO : topic diff=0.003566, rho=0.022686\n", + "2019-01-31 01:23:02,545 : INFO : PROGRESS: pass 0, at document #3888000/4922894\n", + "2019-01-31 01:23:03,904 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:04,170 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:23:04,171 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 
0.007*\"appear\" + 0.007*\"storag\" + 0.006*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:23:04,172 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:23:04,174 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:23:04,175 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:23:04,181 : INFO : topic diff=0.003030, rho=0.022680\n", + "2019-01-31 01:23:04,337 : INFO : PROGRESS: pass 0, at document #3890000/4922894\n", + "2019-01-31 01:23:05,714 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:05,980 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.031*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:23:05,981 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:23:05,982 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:23:05,983 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 
0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:23:05,984 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"storag\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"nicola\"\n", + "2019-01-31 01:23:05,991 : INFO : topic diff=0.003599, rho=0.022675\n", + "2019-01-31 01:23:06,143 : INFO : PROGRESS: pass 0, at document #3892000/4922894\n", + "2019-01-31 01:23:07,495 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:07,761 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"teratogen\"\n", + "2019-01-31 01:23:07,762 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"nicola\" + 0.011*\"author\" + 0.011*\"storag\" + 0.011*\"magazin\"\n", + "2019-01-31 01:23:07,763 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:23:07,764 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.011*\"word\" + 0.011*\"degre\"\n", + "2019-01-31 01:23:07,765 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:23:07,771 : INFO : topic diff=0.003965, rho=0.022669\n", + "2019-01-31 01:23:07,925 : INFO : PROGRESS: pass 0, at 
document #3894000/4922894\n", + "2019-01-31 01:23:09,293 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:09,560 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:23:09,562 : INFO : topic #45 (0.020): 0.038*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.015*\"exhaust\" + 0.015*\"colder\" + 0.015*\"gai\" + 0.014*\"artist\"\n", + "2019-01-31 01:23:09,563 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:23:09,564 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"itali\"\n", + "2019-01-31 01:23:09,565 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"cultur\"\n", + "2019-01-31 01:23:09,571 : INFO : topic diff=0.003767, rho=0.022663\n", + "2019-01-31 01:23:09,728 : INFO : PROGRESS: pass 0, at document #3896000/4922894\n", + "2019-01-31 01:23:11,106 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:11,373 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.011*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:23:11,374 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.026*\"sourc\" + 
0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 01:23:11,375 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:23:11,376 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.018*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:23:11,377 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:23:11,383 : INFO : topic diff=0.003605, rho=0.022657\n", + "2019-01-31 01:23:11,545 : INFO : PROGRESS: pass 0, at document #3898000/4922894\n", + "2019-01-31 01:23:12,935 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:13,201 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.045*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:23:13,202 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"itali\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:23:13,204 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.009*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:23:13,205 : INFO : topic #7 (0.020): 
0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:23:13,206 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.020*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:23:13,211 : INFO : topic diff=0.003725, rho=0.022651\n", + "2019-01-31 01:23:15,903 : INFO : -11.718 per-word bound, 3369.1 perplexity estimate based on a held-out corpus of 2000 documents with 552483 words\n", + "2019-01-31 01:23:15,903 : INFO : PROGRESS: pass 0, at document #3900000/4922894\n", + "2019-01-31 01:23:17,280 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:17,547 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:23:17,548 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.038*\"sovereignti\" + 0.036*\"rural\" + 0.028*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.020*\"poland\" + 0.014*\"tyrant\" + 0.014*\"turin\"\n", + "2019-01-31 01:23:17,549 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 01:23:17,550 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:23:17,551 : INFO : topic #45 (0.020): 0.038*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 
0.015*\"colder\" + 0.015*\"exhaust\" + 0.015*\"gai\" + 0.014*\"artist\"\n", + "2019-01-31 01:23:17,558 : INFO : topic diff=0.002951, rho=0.022646\n", + "2019-01-31 01:23:17,713 : INFO : PROGRESS: pass 0, at document #3902000/4922894\n", + "2019-01-31 01:23:19,062 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:19,328 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"stop\" + 0.016*\"norwai\" + 0.015*\"damag\" + 0.014*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.011*\"denmark\" + 0.011*\"treeless\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:23:19,330 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:23:19,331 : INFO : topic #28 (0.020): 0.034*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:23:19,332 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:23:19,333 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:23:19,339 : INFO : topic diff=0.002800, rho=0.022640\n", + "2019-01-31 01:23:19,552 : INFO : PROGRESS: pass 0, at document #3904000/4922894\n", + "2019-01-31 01:23:20,912 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:21,178 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 
0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:23:21,179 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:23:21,181 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.008*\"local\"\n", + "2019-01-31 01:23:21,182 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:23:21,183 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:23:21,189 : INFO : topic diff=0.003208, rho=0.022634\n", + "2019-01-31 01:23:21,347 : INFO : PROGRESS: pass 0, at document #3906000/4922894\n", + "2019-01-31 01:23:22,710 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:22,976 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\" + 0.011*\"magazin\"\n", + "2019-01-31 01:23:22,977 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:23:22,978 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"australian\" + 
0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"wale\" + 0.014*\"youth\"\n", + "2019-01-31 01:23:22,979 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.042*\"line\" + 0.030*\"raid\" + 0.026*\"rivièr\" + 0.026*\"rosenwald\" + 0.024*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.014*\"oper\" + 0.011*\"radiu\"\n", + "2019-01-31 01:23:22,980 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:23:22,986 : INFO : topic diff=0.003594, rho=0.022628\n", + "2019-01-31 01:23:23,143 : INFO : PROGRESS: pass 0, at document #3908000/4922894\n", + "2019-01-31 01:23:24,520 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:24,786 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:23:24,787 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:23:24,788 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:23:24,790 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:23:24,791 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 
0.011*\"storag\" + 0.011*\"nicola\" + 0.011*\"author\" + 0.011*\"worldwid\"\n", + "2019-01-31 01:23:24,796 : INFO : topic diff=0.004238, rho=0.022622\n", + "2019-01-31 01:23:24,952 : INFO : PROGRESS: pass 0, at document #3910000/4922894\n", + "2019-01-31 01:23:26,318 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:26,584 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:23:26,585 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:23:26,586 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"origin\" + 0.009*\"form\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:23:26,587 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.014*\"driver\" + 0.013*\"fool\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.011*\"find\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:23:26,588 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:23:26,595 : INFO : topic diff=0.003804, rho=0.022617\n", + "2019-01-31 01:23:26,751 : INFO : PROGRESS: pass 0, at document #3912000/4922894\n", + "2019-01-31 01:23:28,299 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:28,567 : INFO : topic #4 (0.020): 
0.020*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:23:28,568 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 01:23:28,569 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:23:28,570 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.019*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:23:28,571 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:23:28,577 : INFO : topic diff=0.003631, rho=0.022611\n", + "2019-01-31 01:23:28,734 : INFO : PROGRESS: pass 0, at document #3914000/4922894\n", + "2019-01-31 01:23:30,105 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:30,372 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.070*\"juli\" + 0.069*\"januari\" + 0.068*\"august\" + 0.067*\"notion\" + 0.066*\"judici\" + 0.064*\"april\" + 0.063*\"decatur\"\n", + "2019-01-31 01:23:30,373 : INFO : topic #24 (0.020): 0.038*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"nicola\" + 0.011*\"storag\" + 0.011*\"magazin\" + 0.011*\"author\"\n", + "2019-01-31 01:23:30,374 : INFO : topic #37 (0.020): 0.013*\"charact\" + 
0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:23:30,375 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.006*\"servitud\"\n", + "2019-01-31 01:23:30,376 : INFO : topic #27 (0.020): 0.072*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.012*\"tornado\" + 0.012*\"ret\" + 0.011*\"find\" + 0.010*\"landslid\" + 0.010*\"champion\"\n", + "2019-01-31 01:23:30,382 : INFO : topic diff=0.002952, rho=0.022605\n", + "2019-01-31 01:23:30,543 : INFO : PROGRESS: pass 0, at document #3916000/4922894\n", + "2019-01-31 01:23:31,944 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:32,210 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:23:32,211 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:23:32,212 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:23:32,213 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:23:32,214 : INFO : topic #37 (0.020): 
0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:23:32,220 : INFO : topic diff=0.004120, rho=0.022599\n", + "2019-01-31 01:23:32,372 : INFO : PROGRESS: pass 0, at document #3918000/4922894\n", + "2019-01-31 01:23:33,710 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:33,976 : INFO : topic #40 (0.020): 0.084*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:23:33,977 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"function\"\n", + "2019-01-31 01:23:33,978 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.015*\"damag\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.013*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:23:33,979 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.019*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:23:33,980 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:23:33,986 : INFO : topic diff=0.003299, rho=0.022593\n", + "2019-01-31 01:23:36,659 : INFO : -11.674 per-word bound, 3267.7 perplexity estimate based on a held-out corpus of 2000 documents with 549204 words\n", + "2019-01-31 01:23:36,660 : INFO : PROGRESS: pass 0, at 
document #3920000/4922894\n", + "2019-01-31 01:23:38,034 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:38,300 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:23:38,301 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.027*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.021*\"moscow\" + 0.020*\"poland\" + 0.014*\"turin\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:23:38,302 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.006*\"servitud\"\n", + "2019-01-31 01:23:38,303 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.024*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:23:38,304 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.015*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:23:38,310 : INFO : topic diff=0.003144, rho=0.022588\n", + "2019-01-31 01:23:38,461 : INFO : PROGRESS: pass 0, at document #3922000/4922894\n", + "2019-01-31 01:23:39,794 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:40,060 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.024*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:23:40,061 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 
0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:23:40,062 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.027*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"citi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:23:40,063 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"norwai\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.013*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:23:40,065 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:23:40,071 : INFO : topic diff=0.003439, rho=0.022582\n", + "2019-01-31 01:23:40,222 : INFO : PROGRESS: pass 0, at document #3924000/4922894\n", + "2019-01-31 01:23:41,558 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:41,824 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.019*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:23:41,825 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"nicola\" + 0.011*\"storag\" + 0.011*\"magazin\" + 0.011*\"author\"\n", + "2019-01-31 01:23:41,827 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.040*\"line\" + 0.030*\"raid\" + 0.027*\"rosenwald\" + 0.026*\"rivièr\" + 0.023*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.010*\"radiu\"\n", + "2019-01-31 01:23:41,828 : 
INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.013*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:23:41,829 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"championship\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.008*\"uruguayan\"\n", + "2019-01-31 01:23:41,835 : INFO : topic diff=0.003635, rho=0.022576\n", + "2019-01-31 01:23:41,989 : INFO : PROGRESS: pass 0, at document #3926000/4922894\n", + "2019-01-31 01:23:43,335 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:43,602 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.013*\"treeless\" + 0.011*\"huntsvil\" + 0.011*\"denmark\"\n", + "2019-01-31 01:23:43,603 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.006*\"rudolf\"\n", + "2019-01-31 01:23:43,604 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:23:43,605 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.015*\"taxpay\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:23:43,606 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\"\n", + 
"2019-01-31 01:23:43,612 : INFO : topic diff=0.003061, rho=0.022570\n", + "2019-01-31 01:23:43,767 : INFO : PROGRESS: pass 0, at document #3928000/4922894\n", + "2019-01-31 01:23:45,137 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:45,403 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:23:45,404 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.030*\"raid\" + 0.027*\"rosenwald\" + 0.026*\"rivièr\" + 0.023*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.010*\"radiu\"\n", + "2019-01-31 01:23:45,406 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:23:45,407 : INFO : topic #45 (0.020): 0.039*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.015*\"exhaust\" + 0.015*\"colder\" + 0.014*\"gai\" + 0.014*\"artist\"\n", + "2019-01-31 01:23:45,408 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:23:45,414 : INFO : topic diff=0.003247, rho=0.022565\n", + "2019-01-31 01:23:45,570 : INFO : PROGRESS: pass 0, at document #3930000/4922894\n", + "2019-01-31 01:23:46,920 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:47,186 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.018*\"polit\" + 0.017*\"player\" + 0.017*\"english\" + 0.011*\"acrimoni\" + 
0.011*\"simpler\"\n", + "2019-01-31 01:23:47,187 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.030*\"raid\" + 0.027*\"rivièr\" + 0.027*\"rosenwald\" + 0.023*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.011*\"radiu\"\n", + "2019-01-31 01:23:47,188 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:23:47,189 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.029*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.013*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:23:47,190 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.015*\"mount\" + 0.015*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:23:47,196 : INFO : topic diff=0.004011, rho=0.022559\n", + "2019-01-31 01:23:47,350 : INFO : PROGRESS: pass 0, at document #3932000/4922894\n", + "2019-01-31 01:23:48,707 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:48,973 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:23:48,974 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:23:48,975 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + 
"2019-01-31 01:23:48,976 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:23:48,977 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"islam\" + 0.011*\"anglo\" + 0.011*\"sri\" + 0.011*\"muskoge\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.010*\"alam\"\n", + "2019-01-31 01:23:48,983 : INFO : topic diff=0.003621, rho=0.022553\n", + "2019-01-31 01:23:49,193 : INFO : PROGRESS: pass 0, at document #3934000/4922894\n", + "2019-01-31 01:23:50,559 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:50,825 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"male\" + 0.006*\"feel\"\n", + "2019-01-31 01:23:50,826 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.019*\"tourist\" + 0.018*\"champion\" + 0.014*\"taxpay\" + 0.014*\"martin\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:23:50,827 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.044*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"regim\"\n", + "2019-01-31 01:23:50,828 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.045*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:23:50,830 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 
0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:23:50,836 : INFO : topic diff=0.004053, rho=0.022547\n", + "2019-01-31 01:23:50,991 : INFO : PROGRESS: pass 0, at document #3936000/4922894\n", + "2019-01-31 01:23:52,345 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:52,612 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:23:52,613 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:23:52,615 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:23:52,616 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.046*\"canadian\" + 0.023*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:23:52,617 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.008*\"championship\"\n", + "2019-01-31 01:23:52,623 : INFO : topic diff=0.003619, rho=0.022542\n", + "2019-01-31 01:23:52,785 : INFO : PROGRESS: pass 0, at document #3938000/4922894\n", + "2019-01-31 01:23:54,176 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:54,443 : INFO : topic #16 (0.020): 0.058*\"king\" + 0.031*\"priest\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 
0.017*\"rotterdam\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.013*\"count\" + 0.012*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 01:23:54,444 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"male\" + 0.006*\"feel\"\n", + "2019-01-31 01:23:54,445 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:23:54,446 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:23:54,448 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.006*\"servitud\"\n", + "2019-01-31 01:23:54,454 : INFO : topic diff=0.003983, rho=0.022536\n", + "2019-01-31 01:23:57,204 : INFO : -11.613 per-word bound, 3132.6 perplexity estimate based on a held-out corpus of 2000 documents with 554556 words\n", + "2019-01-31 01:23:57,204 : INFO : PROGRESS: pass 0, at document #3940000/4922894\n", + "2019-01-31 01:23:58,586 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:23:58,852 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.039*\"rural\" + 0.037*\"sovereignti\" + 0.026*\"poison\" + 0.023*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.014*\"tyrant\" + 0.014*\"turin\"\n", + "2019-01-31 01:23:58,853 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" 
+ 0.004*\"help\"\n", + "2019-01-31 01:23:58,855 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:23:58,856 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.008*\"highli\"\n", + "2019-01-31 01:23:58,857 : INFO : topic #45 (0.020): 0.040*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.015*\"colder\" + 0.015*\"exhaust\" + 0.015*\"gai\" + 0.014*\"artist\"\n", + "2019-01-31 01:23:58,863 : INFO : topic diff=0.003189, rho=0.022530\n", + "2019-01-31 01:23:59,020 : INFO : PROGRESS: pass 0, at document #3942000/4922894\n", + "2019-01-31 01:24:00,383 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:00,650 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.013*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:24:00,651 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:24:00,652 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:24:00,653 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.006*\"rudolf\"\n", + "2019-01-31 
01:24:00,654 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:00,660 : INFO : topic diff=0.003902, rho=0.022525\n", + "2019-01-31 01:24:00,816 : INFO : PROGRESS: pass 0, at document #3944000/4922894\n", + "2019-01-31 01:24:02,194 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:02,460 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.026*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:24:02,461 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:24:02,462 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.029*\"raid\" + 0.027*\"rivièr\" + 0.026*\"rosenwald\" + 0.023*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.011*\"radiu\"\n", + "2019-01-31 01:24:02,463 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.013*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:24:02,464 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:24:02,470 : INFO : topic diff=0.003213, rho=0.022519\n", + "2019-01-31 01:24:02,629 : INFO : PROGRESS: pass 0, at document #3946000/4922894\n", + "2019-01-31 01:24:04,018 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 01:24:04,285 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:24:04,286 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.048*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:24:04,287 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:24:04,288 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:24:04,289 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.024*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"josé\"\n", + "2019-01-31 01:24:04,295 : INFO : topic diff=0.003324, rho=0.022513\n", + "2019-01-31 01:24:04,452 : INFO : PROGRESS: pass 0, at document #3948000/4922894\n", + "2019-01-31 01:24:05,828 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:06,094 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"josé\"\n", + "2019-01-31 01:24:06,095 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.030*\"raid\" + 0.027*\"rivièr\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 
0.018*\"traceabl\" + 0.018*\"serv\" + 0.014*\"oper\" + 0.010*\"radiu\"\n", + "2019-01-31 01:24:06,096 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:24:06,097 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.039*\"rural\" + 0.036*\"sovereignti\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.014*\"tyrant\" + 0.014*\"turin\"\n", + "2019-01-31 01:24:06,098 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:24:06,104 : INFO : topic diff=0.002940, rho=0.022507\n", + "2019-01-31 01:24:06,265 : INFO : PROGRESS: pass 0, at document #3950000/4922894\n", + "2019-01-31 01:24:07,622 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:07,887 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.041*\"line\" + 0.030*\"raid\" + 0.027*\"rivièr\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.010*\"radiu\"\n", + "2019-01-31 01:24:07,888 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.026*\"minist\" + 0.023*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:24:07,889 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.019*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:24:07,890 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 
0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:24:07,892 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:24:07,897 : INFO : topic diff=0.003183, rho=0.022502\n", + "2019-01-31 01:24:08,054 : INFO : PROGRESS: pass 0, at document #3952000/4922894\n", + "2019-01-31 01:24:09,443 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:09,710 : INFO : topic #8 (0.020): 0.028*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.006*\"judaism\"\n", + "2019-01-31 01:24:09,711 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.069*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:24:09,712 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"storag\" + 0.011*\"author\" + 0.011*\"magazin\" + 0.011*\"nicola\"\n", + "2019-01-31 01:24:09,713 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:24:09,714 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:24:09,720 : INFO : topic diff=0.003415, rho=0.022496\n", + "2019-01-31 01:24:09,875 : INFO : PROGRESS: pass 0, at document #3954000/4922894\n", + "2019-01-31 01:24:11,238 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:11,504 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:24:11,505 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.006*\"judaism\"\n", + "2019-01-31 01:24:11,506 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.021*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:24:11,507 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:24:11,508 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:24:11,514 : INFO : topic diff=0.003443, rho=0.022490\n", + "2019-01-31 01:24:11,673 : INFO : PROGRESS: pass 0, at document #3956000/4922894\n", + "2019-01-31 01:24:13,061 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:13,327 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:24:13,328 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.019*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 
0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:24:13,329 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.019*\"alic\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:24:13,330 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:24:13,331 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:24:13,337 : INFO : topic diff=0.003558, rho=0.022485\n", + "2019-01-31 01:24:13,491 : INFO : PROGRESS: pass 0, at document #3958000/4922894\n", + "2019-01-31 01:24:14,854 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:15,120 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:24:15,122 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:24:15,123 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.011*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:15,124 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.016*\"leah\" 
+ 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:24:15,125 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.017*\"player\" + 0.017*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:24:15,131 : INFO : topic diff=0.002872, rho=0.022479\n", + "2019-01-31 01:24:17,762 : INFO : -11.462 per-word bound, 2821.3 perplexity estimate based on a held-out corpus of 2000 documents with 536698 words\n", + "2019-01-31 01:24:17,763 : INFO : PROGRESS: pass 0, at document #3960000/4922894\n", + "2019-01-31 01:24:19,116 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:19,383 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"softwar\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"championship\"\n", + "2019-01-31 01:24:19,384 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:24:19,385 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"vernon\"\n", + "2019-01-31 01:24:19,386 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"hungarian\" + 0.009*\"austria\"\n", + "2019-01-31 01:24:19,387 : INFO : topic #38 (0.020): 0.024*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 
0.006*\"govern\"\n", + "2019-01-31 01:24:19,393 : INFO : topic diff=0.003214, rho=0.022473\n", + "2019-01-31 01:24:19,549 : INFO : PROGRESS: pass 0, at document #3962000/4922894\n", + "2019-01-31 01:24:20,913 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:21,179 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.028*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:24:21,180 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:24:21,181 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:24:21,182 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.013*\"ret\" + 0.013*\"fool\" + 0.010*\"find\" + 0.010*\"landslid\" + 0.010*\"horac\"\n", + "2019-01-31 01:24:21,183 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:24:21,189 : INFO : topic diff=0.003078, rho=0.022468\n", + "2019-01-31 01:24:21,347 : INFO : PROGRESS: pass 0, at document #3964000/4922894\n", + "2019-01-31 01:24:22,731 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:22,997 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"fool\" + 
0.012*\"ret\" + 0.010*\"find\" + 0.010*\"landslid\" + 0.010*\"horac\"\n", + "2019-01-31 01:24:22,998 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.012*\"word\"\n", + "2019-01-31 01:24:22,998 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:24:22,999 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.046*\"franc\" + 0.032*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:24:23,000 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"olympo\" + 0.014*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:24:23,006 : INFO : topic diff=0.002975, rho=0.022462\n", + "2019-01-31 01:24:23,216 : INFO : PROGRESS: pass 0, at document #3966000/4922894\n", + "2019-01-31 01:24:24,596 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:24,862 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.047*\"canadian\" + 0.026*\"hoar\" + 0.024*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:24:24,863 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:24:24,864 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.070*\"juli\" + 0.069*\"januari\" + 0.068*\"august\" + 
0.067*\"notion\" + 0.066*\"judici\" + 0.065*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:24:24,865 : INFO : topic #2 (0.020): 0.052*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.011*\"coalit\" + 0.011*\"nativist\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:24:24,866 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:24:24,872 : INFO : topic diff=0.003814, rho=0.022456\n", + "2019-01-31 01:24:25,026 : INFO : PROGRESS: pass 0, at document #3968000/4922894\n", + "2019-01-31 01:24:26,366 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:26,632 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:24:26,633 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:24:26,635 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:24:26,636 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:26,637 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.013*\"unionist\" + 
0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:24:26,643 : INFO : topic diff=0.003495, rho=0.022451\n", + "2019-01-31 01:24:26,800 : INFO : PROGRESS: pass 0, at document #3970000/4922894\n", + "2019-01-31 01:24:28,182 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:28,450 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:24:28,451 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:24:28,452 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.017*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"crayfish\" + 0.008*\"lobe\"\n", + "2019-01-31 01:24:28,453 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.041*\"line\" + 0.031*\"raid\" + 0.028*\"rivièr\" + 0.026*\"rosenwald\" + 0.023*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:24:28,454 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"selma\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:24:28,460 : INFO : topic diff=0.003436, rho=0.022445\n", + "2019-01-31 01:24:28,614 : INFO : PROGRESS: pass 0, at document #3972000/4922894\n", + "2019-01-31 01:24:29,958 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:30,224 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 
0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:30,225 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.034*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"storag\" + 0.011*\"nicola\"\n", + "2019-01-31 01:24:30,226 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 01:24:30,227 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:24:30,229 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:24:30,234 : INFO : topic diff=0.002874, rho=0.022439\n", + "2019-01-31 01:24:30,392 : INFO : PROGRESS: pass 0, at document #3974000/4922894\n", + "2019-01-31 01:24:31,736 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:32,002 : INFO : topic #45 (0.020): 0.041*\"arsen\" + 0.029*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.015*\"colder\" + 0.015*\"gai\" + 0.015*\"exhaust\" + 0.014*\"artist\"\n", + "2019-01-31 01:24:32,003 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:24:32,004 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"taxpay\" + 
0.026*\"scientist\" + 0.024*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:24:32,006 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.006*\"incom\" + 0.006*\"trap\" + 0.006*\"male\"\n", + "2019-01-31 01:24:32,007 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.008*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:24:32,013 : INFO : topic diff=0.003560, rho=0.022434\n", + "2019-01-31 01:24:32,172 : INFO : PROGRESS: pass 0, at document #3976000/4922894\n", + "2019-01-31 01:24:33,539 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:33,807 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.017*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"crayfish\" + 0.008*\"lobe\"\n", + "2019-01-31 01:24:33,808 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:24:33,809 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:24:33,810 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:33,811 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 
0.022*\"collector\" + 0.022*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:24:33,817 : INFO : topic diff=0.003857, rho=0.022428\n", + "2019-01-31 01:24:33,977 : INFO : PROGRESS: pass 0, at document #3978000/4922894\n", + "2019-01-31 01:24:35,358 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:35,625 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:24:35,626 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 01:24:35,628 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.035*\"new\" + 0.032*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:24:35,629 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.012*\"diversifi\" + 0.012*\"militari\" + 0.012*\"airbu\"\n", + "2019-01-31 01:24:35,630 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.032*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:24:35,635 : INFO : topic diff=0.003372, rho=0.022422\n", + "2019-01-31 01:24:38,339 : INFO : -11.565 per-word bound, 3030.1 perplexity estimate based on a held-out corpus of 2000 documents with 581484 words\n", + "2019-01-31 01:24:38,339 : INFO : PROGRESS: pass 0, at document #3980000/4922894\n", + "2019-01-31 01:24:39,718 : INFO : 
merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:39,984 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"olympo\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:24:39,985 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"denmark\" + 0.010*\"huntsvil\"\n", + "2019-01-31 01:24:39,986 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.017*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.017*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:24:39,987 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:24:39,988 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:24:39,993 : INFO : topic diff=0.003445, rho=0.022417\n", + "2019-01-31 01:24:40,148 : INFO : PROGRESS: pass 0, at document #3982000/4922894\n", + "2019-01-31 01:24:41,501 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:41,767 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"jame\" + 0.011*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\" + 0.007*\"georg\"\n", + "2019-01-31 01:24:41,768 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 
0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:24:41,769 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.029*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:24:41,770 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"islam\" + 0.012*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.010*\"sri\" + 0.010*\"alam\"\n", + "2019-01-31 01:24:41,771 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"http\" + 0.011*\"word\"\n", + "2019-01-31 01:24:41,778 : INFO : topic diff=0.003602, rho=0.022411\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:24:41,935 : INFO : PROGRESS: pass 0, at document #3984000/4922894\n", + "2019-01-31 01:24:43,301 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:43,569 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:24:43,570 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:24:43,571 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.070*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.020*\"noll\" + 0.018*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:24:43,572 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 
0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:24:43,573 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"wind\" + 0.015*\"swedish\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"denmark\" + 0.011*\"huntsvil\"\n", + "2019-01-31 01:24:43,579 : INFO : topic diff=0.003115, rho=0.022406\n", + "2019-01-31 01:24:43,742 : INFO : PROGRESS: pass 0, at document #3986000/4922894\n", + "2019-01-31 01:24:45,137 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:45,403 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.005*\"method\"\n", + "2019-01-31 01:24:45,404 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"pour\" + 0.014*\"depress\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:24:45,405 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.017*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.017*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:24:45,406 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.012*\"open\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:24:45,407 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:24:45,413 : INFO : topic diff=0.004412, rho=0.022400\n", + "2019-01-31 
01:24:45,570 : INFO : PROGRESS: pass 0, at document #3988000/4922894\n", + "2019-01-31 01:24:46,926 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:47,192 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:47,194 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:24:47,195 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.070*\"best\" + 0.033*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.018*\"women\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:24:47,196 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.035*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:24:47,197 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.040*\"line\" + 0.030*\"raid\" + 0.028*\"rivièr\" + 0.027*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.011*\"rail\"\n", + "2019-01-31 01:24:47,202 : INFO : topic diff=0.003197, rho=0.022394\n", + "2019-01-31 01:24:47,358 : INFO : PROGRESS: pass 0, at document #3990000/4922894\n", + "2019-01-31 01:24:48,727 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:48,993 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.022*\"christian\" + 0.022*\"cathol\" + 0.019*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:24:48,995 : INFO : topic 
#8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.019*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:24:48,996 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:24:48,996 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.046*\"canadian\" + 0.026*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.016*\"new\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:24:48,997 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:24:49,003 : INFO : topic diff=0.002406, rho=0.022389\n", + "2019-01-31 01:24:49,161 : INFO : PROGRESS: pass 0, at document #3992000/4922894\n", + "2019-01-31 01:24:50,551 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:50,817 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 01:24:50,818 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.014*\"blur\" + 0.014*\"pope\" + 0.011*\"coalit\" + 0.010*\"nativist\" + 0.009*\"class\" + 0.009*\"vernon\"\n", + "2019-01-31 01:24:50,819 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:24:50,820 : INFO : topic #10 (0.020): 
0.011*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:24:50,821 : INFO : topic #13 (0.020): 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"ireland\" + 0.019*\"british\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:24:50,827 : INFO : topic diff=0.002651, rho=0.022383\n", + "2019-01-31 01:24:50,987 : INFO : PROGRESS: pass 0, at document #3994000/4922894\n", + "2019-01-31 01:24:52,368 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:52,636 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:24:52,637 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.006*\"incom\" + 0.006*\"trap\" + 0.006*\"male\"\n", + "2019-01-31 01:24:52,639 : INFO : topic #45 (0.020): 0.042*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.015*\"exhaust\" + 0.015*\"gai\" + 0.014*\"artist\"\n", + "2019-01-31 01:24:52,640 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:24:52,641 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"jame\" + 0.011*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.007*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:24:52,647 : INFO : topic diff=0.004230, rho=0.022377\n", + 
"2019-01-31 01:24:52,801 : INFO : PROGRESS: pass 0, at document #3996000/4922894\n", + "2019-01-31 01:24:54,166 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:24:54,433 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.040*\"line\" + 0.030*\"raid\" + 0.028*\"rivièr\" + 0.027*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.010*\"rail\"\n", + "2019-01-31 01:24:54,434 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"horac\" + 0.010*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:24:54,435 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"jame\" + 0.011*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.007*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:24:54,436 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:24:54,437 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:24:54,443 : INFO : topic diff=0.002595, rho=0.022372\n", + "2019-01-31 01:24:54,593 : INFO : PROGRESS: pass 0, at document #3998000/4922894\n", + "2019-01-31 01:24:55,917 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:24:56,183 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + 
"2019-01-31 01:24:56,184 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:24:56,185 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:24:56,186 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:24:56,187 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.023*\"hong\" + 0.022*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.015*\"leah\" + 0.013*\"shirin\"\n", + "2019-01-31 01:24:56,193 : INFO : topic diff=0.003609, rho=0.022366\n", + "2019-01-31 01:24:58,969 : INFO : -11.467 per-word bound, 2831.4 perplexity estimate based on a held-out corpus of 2000 documents with 564962 words\n", + "2019-01-31 01:24:58,970 : INFO : PROGRESS: pass 0, at document #4000000/4922894\n", + "2019-01-31 01:25:00,356 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:00,623 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.022*\"govern\" + 0.021*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:25:00,624 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.019*\"duke\" + 0.019*\"grammat\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.015*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:25:00,625 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.040*\"struggl\" + 
0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:25:00,626 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:25:00,627 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.012*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 01:25:00,633 : INFO : topic diff=0.003644, rho=0.022361\n", + "2019-01-31 01:25:00,789 : INFO : PROGRESS: pass 0, at document #4002000/4922894\n", + "2019-01-31 01:25:02,147 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:02,413 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:25:02,414 : INFO : topic #45 (0.020): 0.042*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.015*\"exhaust\" + 0.015*\"gai\" + 0.014*\"artist\"\n", + "2019-01-31 01:25:02,416 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:25:02,417 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.040*\"line\" + 0.030*\"raid\" + 0.029*\"rivièr\" + 0.027*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:25:02,418 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 
0.013*\"pakistan\" + 0.012*\"islam\" + 0.012*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.011*\"sri\" + 0.010*\"affection\"\n", + "2019-01-31 01:25:02,423 : INFO : topic diff=0.003159, rho=0.022355\n", + "2019-01-31 01:25:02,577 : INFO : PROGRESS: pass 0, at document #4004000/4922894\n", + "2019-01-31 01:25:03,935 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:04,201 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:25:04,202 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:25:04,203 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.022*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.014*\"tyrant\" + 0.013*\"czech\"\n", + "2019-01-31 01:25:04,204 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.013*\"septemb\" + 0.011*\"anim\" + 0.011*\"comic\" + 0.010*\"man\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:25:04,205 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"have\" + 0.007*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:25:04,211 : INFO : topic diff=0.003707, rho=0.022350\n", + "2019-01-31 01:25:04,365 : INFO : PROGRESS: pass 0, at document #4006000/4922894\n", + "2019-01-31 01:25:05,729 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:05,996 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 
0.039*\"line\" + 0.030*\"raid\" + 0.029*\"rivièr\" + 0.027*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 01:25:05,997 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:25:05,998 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:25:05,999 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"trap\" + 0.006*\"black\"\n", + "2019-01-31 01:25:06,001 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:25:06,006 : INFO : topic diff=0.003550, rho=0.022344\n", + "2019-01-31 01:25:06,162 : INFO : PROGRESS: pass 0, at document #4008000/4922894\n", + "2019-01-31 01:25:07,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:07,800 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.008*\"vacant\" + 0.008*\"lobe\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:25:07,801 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.007*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:25:07,802 : INFO : topic #4 
(0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:25:07,804 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"jeremiah\" + 0.009*\"austria\"\n", + "2019-01-31 01:25:07,805 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:25:07,811 : INFO : topic diff=0.002982, rho=0.022338\n", + "2019-01-31 01:25:07,969 : INFO : PROGRESS: pass 0, at document #4010000/4922894\n", + "2019-01-31 01:25:09,346 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:09,613 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:25:09,614 : INFO : topic #45 (0.020): 0.041*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.014*\"exhaust\" + 0.014*\"artist\" + 0.014*\"gai\"\n", + "2019-01-31 01:25:09,615 : INFO : topic #39 (0.020): 0.057*\"canada\" + 0.046*\"canadian\" + 0.026*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"hydrogen\" + 0.016*\"new\" + 0.015*\"novotná\" + 0.014*\"misericordia\" + 0.014*\"quebec\"\n", + "2019-01-31 01:25:09,616 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:25:09,617 : INFO : 
topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:25:09,623 : INFO : topic diff=0.003590, rho=0.022333\n", + "2019-01-31 01:25:09,778 : INFO : PROGRESS: pass 0, at document #4012000/4922894\n", + "2019-01-31 01:25:11,121 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:11,387 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:25:11,388 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:25:11,389 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.048*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.015*\"sourc\" + 0.015*\"leah\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:25:11,390 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"word\" + 0.012*\"http\"\n", + "2019-01-31 01:25:11,391 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"trap\" + 0.006*\"black\"\n", + "2019-01-31 01:25:11,397 : INFO : topic diff=0.002659, rho=0.022327\n", + "2019-01-31 01:25:11,556 : INFO : PROGRESS: pass 0, at document #4014000/4922894\n", + "2019-01-31 01:25:12,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:13,207 
: INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.016*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"vacant\"\n", + "2019-01-31 01:25:13,208 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:25:13,209 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:25:13,210 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.039*\"line\" + 0.030*\"raid\" + 0.028*\"rosenwald\" + 0.028*\"rivièr\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.011*\"brook\"\n", + "2019-01-31 01:25:13,211 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"trap\" + 0.006*\"black\"\n", + "2019-01-31 01:25:13,217 : INFO : topic diff=0.003417, rho=0.022322\n", + "2019-01-31 01:25:13,371 : INFO : PROGRESS: pass 0, at document #4016000/4922894\n", + "2019-01-31 01:25:14,730 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:14,996 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.045*\"vigour\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:25:14,997 : INFO : topic #45 (0.020): 0.041*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.019*\"illicit\" + 0.015*\"colder\" + 0.015*\"exhaust\" + 0.014*\"artist\" + 0.014*\"gai\"\n", + "2019-01-31 01:25:14,998 : INFO : topic #43 
(0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:25:14,999 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:25:15,000 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:25:15,006 : INFO : topic diff=0.003130, rho=0.022316\n", + "2019-01-31 01:25:15,167 : INFO : PROGRESS: pass 0, at document #4018000/4922894\n", + "2019-01-31 01:25:16,571 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:16,838 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:25:16,839 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:25:16,841 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:25:16,842 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"viru\" + 0.006*\"proper\" + 0.006*\"effect\"\n", + "2019-01-31 01:25:16,842 : INFO : topic #13 (0.020): 
0.026*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:25:16,848 : INFO : topic diff=0.003366, rho=0.022311\n", + "2019-01-31 01:25:19,589 : INFO : -11.564 per-word bound, 3027.2 perplexity estimate based on a held-out corpus of 2000 documents with 600277 words\n", + "2019-01-31 01:25:19,590 : INFO : PROGRESS: pass 0, at document #4020000/4922894\n", + "2019-01-31 01:25:20,989 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:21,256 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.013*\"report\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:25:21,257 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:25:21,258 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.005*\"method\"\n", + "2019-01-31 01:25:21,260 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:25:21,261 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:25:21,267 : INFO : topic diff=0.004216, 
rho=0.022305\n", + "2019-01-31 01:25:21,424 : INFO : PROGRESS: pass 0, at document #4022000/4922894\n", + "2019-01-31 01:25:22,804 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:23,070 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.072*\"best\" + 0.035*\"yawn\" + 0.027*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:25:23,071 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.020*\"ireland\" + 0.020*\"british\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:25:23,072 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:25:23,074 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.080*\"sens\" + 0.078*\"octob\" + 0.071*\"juli\" + 0.069*\"august\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.067*\"april\" + 0.067*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:25:23,075 : INFO : topic #32 (0.020): 0.048*\"district\" + 0.045*\"vigour\" + 0.045*\"popolo\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.026*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:25:23,081 : INFO : topic diff=0.003779, rho=0.022299\n", + "2019-01-31 01:25:23,236 : INFO : PROGRESS: pass 0, at document #4024000/4922894\n", + "2019-01-31 01:25:24,624 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:24,890 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.022*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.016*\"kim\" + 0.015*\"sourc\" + 0.013*\"shirin\"\n", + "2019-01-31 01:25:24,891 : INFO : topic #30 
(0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:25:24,893 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"viru\" + 0.006*\"effect\"\n", + "2019-01-31 01:25:24,894 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:25:24,895 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.013*\"septemb\" + 0.011*\"comic\" + 0.010*\"anim\" + 0.010*\"man\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:25:24,901 : INFO : topic diff=0.002904, rho=0.022294\n", + "2019-01-31 01:25:25,060 : INFO : PROGRESS: pass 0, at document #4026000/4922894\n", + "2019-01-31 01:25:26,447 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:26,715 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.012*\"ret\" + 0.011*\"horac\" + 0.010*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:25:26,716 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.006*\"incom\" + 0.006*\"trap\" + 0.006*\"male\"\n", + "2019-01-31 01:25:26,717 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:25:26,718 : INFO : topic #10 (0.020): 0.010*\"cdd\" 
+ 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"viru\" + 0.006*\"effect\"\n", + "2019-01-31 01:25:26,719 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.021*\"grammat\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.015*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 01:25:26,725 : INFO : topic diff=0.003221, rho=0.022288\n", + "2019-01-31 01:25:26,878 : INFO : PROGRESS: pass 0, at document #4028000/4922894\n", + "2019-01-31 01:25:28,226 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:28,493 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.016*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:25:28,494 : INFO : topic #45 (0.020): 0.041*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.015*\"exhaust\" + 0.015*\"artist\" + 0.015*\"colder\" + 0.014*\"gai\"\n", + "2019-01-31 01:25:28,495 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:25:28,496 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.027*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"alic\" + 0.018*\"atheist\"\n", + "2019-01-31 01:25:28,497 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.020*\"act\" + 0.019*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:25:28,503 : INFO : topic diff=0.004118, rho=0.022283\n", + "2019-01-31 
01:25:28,717 : INFO : PROGRESS: pass 0, at document #4030000/4922894\n", + "2019-01-31 01:25:30,100 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:30,367 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.013*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.010*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:25:30,368 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.014*\"blur\" + 0.013*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:25:30,369 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.026*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"ireland\" + 0.020*\"british\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:25:30,370 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.027*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"festiv\" + 0.019*\"women\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:25:30,371 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.012*\"refut\"\n", + "2019-01-31 01:25:30,377 : INFO : topic diff=0.003081, rho=0.022277\n", + "2019-01-31 01:25:30,529 : INFO : PROGRESS: pass 0, at document #4032000/4922894\n", + "2019-01-31 01:25:31,874 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:32,140 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:25:32,141 : INFO : topic #39 (0.020): 0.058*\"canada\" + 
0.046*\"canadian\" + 0.025*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.017*\"new\" + 0.016*\"hydrogen\" + 0.015*\"quebec\" + 0.015*\"misericordia\" + 0.014*\"novotná\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:25:32,142 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:25:32,143 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:25:32,144 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:25:32,150 : INFO : topic diff=0.003248, rho=0.022272\n", + "2019-01-31 01:25:32,301 : INFO : PROGRESS: pass 0, at document #4034000/4922894\n", + "2019-01-31 01:25:33,642 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:33,909 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.012*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:25:33,910 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:25:33,911 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"citi\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + 
"2019-01-31 01:25:33,912 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:25:33,913 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"viru\"\n", + "2019-01-31 01:25:33,919 : INFO : topic diff=0.003288, rho=0.022266\n", + "2019-01-31 01:25:34,077 : INFO : PROGRESS: pass 0, at document #4036000/4922894\n", + "2019-01-31 01:25:35,465 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:35,731 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:25:35,732 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.020*\"act\" + 0.019*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:25:35,733 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.011*\"ret\" + 0.011*\"horac\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:25:35,734 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.014*\"blur\" + 0.013*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:25:35,735 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:25:35,741 : INFO : 
topic diff=0.003350, rho=0.022261\n", + "2019-01-31 01:25:35,895 : INFO : PROGRESS: pass 0, at document #4038000/4922894\n", + "2019-01-31 01:25:37,227 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:37,493 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"ireland\" + 0.019*\"british\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:25:37,494 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:25:37,495 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.010*\"affection\"\n", + "2019-01-31 01:25:37,496 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.035*\"new\" + 0.032*\"american\" + 0.028*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:25:37,497 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:25:37,503 : INFO : topic diff=0.002925, rho=0.022255\n", + "2019-01-31 01:25:40,142 : INFO : -11.667 per-word bound, 3252.0 perplexity estimate based on a held-out corpus of 2000 documents with 556180 words\n", + "2019-01-31 01:25:40,143 : INFO : PROGRESS: pass 0, at document #4040000/4922894\n", + "2019-01-31 01:25:41,493 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:41,759 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" 
+ 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:25:41,760 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"measur\"\n", + "2019-01-31 01:25:41,762 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"comic\" + 0.010*\"man\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:25:41,763 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.010*\"affection\"\n", + "2019-01-31 01:25:41,764 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:25:41,770 : INFO : topic diff=0.003412, rho=0.022250\n", + "2019-01-31 01:25:41,925 : INFO : PROGRESS: pass 0, at document #4042000/4922894\n", + "2019-01-31 01:25:43,281 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:43,547 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"task\" + 0.009*\"district\" + 0.009*\"gothic\"\n", + "2019-01-31 01:25:43,548 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.047*\"canadian\" + 0.025*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.015*\"quebec\" + 0.015*\"misericordia\" + 0.013*\"novotná\"\n", + "2019-01-31 01:25:43,549 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"offic\" + 
0.024*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.019*\"serv\" + 0.016*\"start\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:25:43,550 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:25:43,551 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:25:43,557 : INFO : topic diff=0.003158, rho=0.022244\n", + "2019-01-31 01:25:43,720 : INFO : PROGRESS: pass 0, at document #4044000/4922894\n", + "2019-01-31 01:25:45,141 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:45,408 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:25:45,409 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:25:45,410 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:25:45,411 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"poll\" + 0.010*\"parish\" + 0.009*\"relationship\" + 0.009*\"historiographi\"\n", + "2019-01-31 
01:25:45,412 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:25:45,418 : INFO : topic diff=0.004157, rho=0.022239\n", + "2019-01-31 01:25:45,580 : INFO : PROGRESS: pass 0, at document #4046000/4922894\n", + "2019-01-31 01:25:46,947 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:47,214 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"turn\" + 0.006*\"produc\"\n", + "2019-01-31 01:25:47,215 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.013*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:25:47,216 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.021*\"grammat\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.015*\"quarterli\" + 0.014*\"brazil\" + 0.013*\"kingdom\" + 0.013*\"portugues\"\n", + "2019-01-31 01:25:47,216 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.024*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:25:47,218 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.016*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.012*\"proclaim\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:25:47,223 : INFO : topic diff=0.003119, rho=0.022233\n", + "2019-01-31 01:25:47,379 : INFO : PROGRESS: pass 0, at document #4048000/4922894\n", + "2019-01-31 01:25:48,749 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:25:49,015 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"degre\" + 0.012*\"word\"\n", + "2019-01-31 01:25:49,017 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:25:49,018 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.044*\"vigour\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.025*\"multitud\" + 0.022*\"area\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:25:49,019 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:25:49,020 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:25:49,026 : INFO : topic diff=0.003227, rho=0.022228\n", + "2019-01-31 01:25:49,183 : INFO : PROGRESS: pass 0, at document #4050000/4922894\n", + "2019-01-31 01:25:50,540 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:50,807 : INFO : topic #17 (0.020): 0.076*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"parish\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:25:50,808 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 
0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:25:50,809 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:25:50,810 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:25:50,811 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.011*\"horac\" + 0.011*\"ret\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:25:50,817 : INFO : topic diff=0.003542, rho=0.022222\n", + "2019-01-31 01:25:50,974 : INFO : PROGRESS: pass 0, at document #4052000/4922894\n", + "2019-01-31 01:25:52,330 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:52,597 : INFO : topic #45 (0.020): 0.041*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.021*\"pain\" + 0.021*\"illicit\" + 0.016*\"exhaust\" + 0.015*\"artist\" + 0.015*\"gai\" + 0.014*\"colder\"\n", + "2019-01-31 01:25:52,598 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.020*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.007*\"trap\" + 0.006*\"florida\"\n", + "2019-01-31 01:25:52,599 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"vacant\"\n", + "2019-01-31 01:25:52,601 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 
0.013*\"toyota\" + 0.009*\"vocabulari\"\n", + "2019-01-31 01:25:52,602 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.008*\"highli\"\n", + "2019-01-31 01:25:52,608 : INFO : topic diff=0.003277, rho=0.022217\n", + "2019-01-31 01:25:52,763 : INFO : PROGRESS: pass 0, at document #4054000/4922894\n", + "2019-01-31 01:25:54,130 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:54,396 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.016*\"warmth\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"palmer\" + 0.008*\"foam\"\n", + "2019-01-31 01:25:54,398 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.016*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:25:54,399 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.047*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.015*\"quebec\" + 0.014*\"misericordia\" + 0.014*\"novotná\"\n", + "2019-01-31 01:25:54,400 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.027*\"jacksonvil\" + 0.023*\"japanes\" + 0.023*\"noll\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:25:54,401 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:25:54,407 : INFO : topic diff=0.003286, rho=0.022211\n", + "2019-01-31 01:25:54,564 : INFO : PROGRESS: pass 0, at document #4056000/4922894\n", + "2019-01-31 01:25:55,921 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:56,187 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"driver\" + 0.012*\"fool\" + 0.011*\"horac\" + 0.011*\"ret\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:25:56,188 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.030*\"priest\" + 0.021*\"grammat\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.015*\"quarterli\" + 0.014*\"brazil\" + 0.013*\"kingdom\" + 0.013*\"portugues\"\n", + "2019-01-31 01:25:56,189 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.022*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.015*\"quebec\" + 0.014*\"misericordia\" + 0.014*\"novotná\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:25:56,190 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.008*\"highli\"\n", + "2019-01-31 01:25:56,191 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.079*\"sens\" + 0.079*\"octob\" + 0.072*\"juli\" + 0.071*\"august\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.068*\"april\" + 0.067*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:25:56,197 : INFO : topic diff=0.002664, rho=0.022206\n", + "2019-01-31 01:25:56,356 : INFO : PROGRESS: pass 0, at document #4058000/4922894\n", + "2019-01-31 01:25:57,775 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:25:58,041 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"servitud\"\n", + "2019-01-31 01:25:58,042 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 
0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:25:58,044 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:25:58,045 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:25:58,046 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.035*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.023*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:25:58,051 : INFO : topic diff=0.002453, rho=0.022200\n", + "2019-01-31 01:26:00,758 : INFO : -11.755 per-word bound, 3456.8 perplexity estimate based on a held-out corpus of 2000 documents with 580737 words\n", + "2019-01-31 01:26:00,758 : INFO : PROGRESS: pass 0, at document #4060000/4922894\n", + "2019-01-31 01:26:02,143 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:02,409 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"degre\" + 0.012*\"word\"\n", + "2019-01-31 01:26:02,410 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:26:02,411 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.036*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.023*\"year\" + 0.016*\"california\" + 
0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:26:02,412 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:26:02,413 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"championship\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.008*\"diggin\"\n", + "2019-01-31 01:26:02,419 : INFO : topic diff=0.003339, rho=0.022195\n", + "2019-01-31 01:26:02,629 : INFO : PROGRESS: pass 0, at document #4062000/4922894\n", + "2019-01-31 01:26:03,994 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:04,261 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:26:04,262 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.016*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:26:04,263 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:26:04,264 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"islam\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:26:04,265 : INFO : topic #26 (0.020): 0.032*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 
0.019*\"atheist\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:26:04,271 : INFO : topic diff=0.003126, rho=0.022189\n", + "2019-01-31 01:26:04,425 : INFO : PROGRESS: pass 0, at document #4064000/4922894\n", + "2019-01-31 01:26:05,763 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:06,030 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.012*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"storag\" + 0.011*\"author\"\n", + "2019-01-31 01:26:06,031 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:26:06,032 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.022*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:26:06,033 : INFO : topic #45 (0.020): 0.041*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.025*\"museo\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.016*\"exhaust\" + 0.015*\"artist\" + 0.015*\"gai\" + 0.014*\"colder\"\n", + "2019-01-31 01:26:06,034 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.011*\"proclaim\" + 0.011*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:26:06,040 : INFO : topic diff=0.003055, rho=0.022184\n", + "2019-01-31 01:26:06,210 : INFO : PROGRESS: pass 0, at document #4066000/4922894\n", + "2019-01-31 01:26:07,574 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:07,841 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 
0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:26:07,842 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.039*\"line\" + 0.031*\"raid\" + 0.029*\"rivièr\" + 0.028*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:26:07,843 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.016*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:26:07,844 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.008*\"highli\"\n", + "2019-01-31 01:26:07,845 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.033*\"perceptu\" + 0.019*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"word\"\n", + "2019-01-31 01:26:07,851 : INFO : topic diff=0.003010, rho=0.022178\n", + "2019-01-31 01:26:08,009 : INFO : PROGRESS: pass 0, at document #4068000/4922894\n", + "2019-01-31 01:26:09,393 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:09,660 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:26:09,661 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.039*\"line\" + 0.031*\"raid\" + 0.029*\"rivièr\" + 0.029*\"rosenwald\" + 0.021*\"airmen\" + 0.019*\"serv\" + 0.017*\"traceabl\" + 0.014*\"oper\" + 0.011*\"transient\"\n", + "2019-01-31 01:26:09,662 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.010*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" 
+ 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:26:09,663 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:26:09,664 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.028*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:26:09,670 : INFO : topic diff=0.003459, rho=0.022173\n", + "2019-01-31 01:26:09,831 : INFO : PROGRESS: pass 0, at document #4070000/4922894\n", + "2019-01-31 01:26:11,220 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:11,487 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.010*\"anim\" + 0.010*\"man\" + 0.010*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:26:11,488 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.041*\"american\" + 0.031*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.014*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:26:11,489 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.035*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"start\"\n", + "2019-01-31 01:26:11,490 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 01:26:11,491 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 
0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.015*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"brazil\" + 0.012*\"portugues\"\n", + "2019-01-31 01:26:11,497 : INFO : topic diff=0.004236, rho=0.022168\n", + "2019-01-31 01:26:11,656 : INFO : PROGRESS: pass 0, at document #4072000/4922894\n", + "2019-01-31 01:26:13,017 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:13,283 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:26:13,284 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"utopian\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"servitud\"\n", + "2019-01-31 01:26:13,286 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 0.030*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"task\" + 0.009*\"district\" + 0.009*\"start\"\n", + "2019-01-31 01:26:13,286 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.077*\"octob\" + 0.071*\"juli\" + 0.070*\"august\" + 0.070*\"januari\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.067*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:26:13,287 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.012*\"islam\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:26:13,293 : INFO : topic diff=0.002984, rho=0.022162\n", + "2019-01-31 01:26:13,453 : INFO : PROGRESS: pass 0, at document #4074000/4922894\n", + "2019-01-31 01:26:14,881 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:15,149 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.028*\"hous\" + 
0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:26:15,149 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.016*\"quarterli\" + 0.013*\"order\" + 0.013*\"kingdom\" + 0.013*\"brazil\"\n", + "2019-01-31 01:26:15,151 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:26:15,152 : INFO : topic #45 (0.020): 0.042*\"arsen\" + 0.029*\"jpg\" + 0.027*\"fifteenth\" + 0.026*\"museo\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.015*\"gai\" + 0.014*\"colder\"\n", + "2019-01-31 01:26:15,153 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.041*\"american\" + 0.031*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.014*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:26:15,159 : INFO : topic diff=0.002967, rho=0.022157\n", + "2019-01-31 01:26:15,315 : INFO : PROGRESS: pass 0, at document #4076000/4922894\n", + "2019-01-31 01:26:16,675 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:16,942 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.034*\"sovereignti\" + 0.034*\"rural\" + 0.027*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.015*\"malaysia\" + 0.014*\"czech\"\n", + "2019-01-31 01:26:16,943 : INFO : topic #48 (0.020): 0.078*\"octob\" + 0.077*\"march\" + 0.077*\"sens\" + 0.068*\"juli\" + 0.068*\"januari\" + 0.068*\"august\" + 0.066*\"notion\" + 0.065*\"april\" + 0.065*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 01:26:16,944 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 
0.033*\"perceptu\" + 0.019*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 01:26:16,945 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:26:16,946 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.016*\"new\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:26:16,952 : INFO : topic diff=0.004049, rho=0.022151\n", + "2019-01-31 01:26:17,106 : INFO : PROGRESS: pass 0, at document #4078000/4922894\n", + "2019-01-31 01:26:18,452 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:18,719 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:26:18,719 : INFO : topic #48 (0.020): 0.077*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.068*\"juli\" + 0.068*\"august\" + 0.068*\"januari\" + 0.066*\"notion\" + 0.065*\"april\" + 0.064*\"judici\" + 0.062*\"decatur\"\n", + "2019-01-31 01:26:18,721 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.012*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:26:18,722 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:26:18,723 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.033*\"incumb\" + 
0.014*\"pakistan\" + 0.012*\"islam\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:26:18,729 : INFO : topic diff=0.003817, rho=0.022146\n", + "2019-01-31 01:26:21,367 : INFO : -11.815 per-word bound, 3603.7 perplexity estimate based on a held-out corpus of 2000 documents with 532709 words\n", + "2019-01-31 01:26:21,368 : INFO : PROGRESS: pass 0, at document #4080000/4922894\n", + "2019-01-31 01:26:22,830 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:23,097 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"horac\" + 0.011*\"find\" + 0.010*\"ret\" + 0.010*\"théori\"\n", + "2019-01-31 01:26:23,098 : INFO : topic #22 (0.020): 0.035*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"florida\" + 0.006*\"trap\"\n", + "2019-01-31 01:26:23,099 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.021*\"new\" + 0.017*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:26:23,101 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.036*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.023*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:26:23,102 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.034*\"rural\" + 0.034*\"sovereignti\" + 0.027*\"poison\" + 0.026*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.015*\"malaysia\" + 0.014*\"czech\"\n", + "2019-01-31 01:26:23,108 : INFO : topic diff=0.003375, rho=0.022140\n", + "2019-01-31 01:26:23,265 : INFO : 
PROGRESS: pass 0, at document #4082000/4922894\n", + "2019-01-31 01:26:24,630 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:24,896 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.016*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"order\" + 0.013*\"brazil\"\n", + "2019-01-31 01:26:24,897 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.073*\"best\" + 0.033*\"yawn\" + 0.026*\"jacksonvil\" + 0.022*\"noll\" + 0.022*\"japanes\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.016*\"intern\" + 0.015*\"prison\"\n", + "2019-01-31 01:26:24,899 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:26:24,900 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.026*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.022*\"govern\" + 0.020*\"member\" + 0.018*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:26:24,901 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.012*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:26:24,907 : INFO : topic diff=0.003500, rho=0.022135\n", + "2019-01-31 01:26:25,069 : INFO : PROGRESS: pass 0, at document #4084000/4922894\n", + "2019-01-31 01:26:26,492 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:26,759 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.022*\"act\" + 0.019*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:26:26,760 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 
0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:26:26,761 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:26:26,762 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.035*\"new\" + 0.032*\"american\" + 0.028*\"unionist\" + 0.025*\"cotton\" + 0.023*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:26:26,764 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:26:26,769 : INFO : topic diff=0.004004, rho=0.022130\n", + "2019-01-31 01:26:26,927 : INFO : PROGRESS: pass 0, at document #4086000/4922894\n", + "2019-01-31 01:26:28,299 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:28,566 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"liber\"\n", + "2019-01-31 01:26:28,567 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:26:28,568 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.021*\"spain\" + 0.018*\"del\" + 0.016*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:26:28,569 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 
0.020*\"korea\" + 0.017*\"leah\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:26:28,570 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"austria\" + 0.008*\"europ\"\n", + "2019-01-31 01:26:28,576 : INFO : topic diff=0.003410, rho=0.022124\n", + "2019-01-31 01:26:28,727 : INFO : PROGRESS: pass 0, at document #4088000/4922894\n", + "2019-01-31 01:26:30,080 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:30,347 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:26:30,348 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:26:30,349 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"utopian\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.005*\"servitud\"\n", + "2019-01-31 01:26:30,350 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.024*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:26:30,351 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.073*\"best\" + 0.033*\"yawn\" + 0.026*\"jacksonvil\" + 0.022*\"noll\" + 0.022*\"japanes\" + 0.019*\"women\" + 0.019*\"festiv\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:26:30,357 : INFO : topic diff=0.003410, rho=0.022119\n", + "2019-01-31 01:26:30,513 : INFO : PROGRESS: pass 0, at document 
#4090000/4922894\n", + "2019-01-31 01:26:31,876 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:32,143 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:26:32,144 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:26:32,145 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\" + 0.013*\"martin\"\n", + "2019-01-31 01:26:32,146 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.033*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"english\" + 0.017*\"folei\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:26:32,148 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.013*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:26:32,154 : INFO : topic diff=0.003523, rho=0.022113\n", + "2019-01-31 01:26:32,316 : INFO : PROGRESS: pass 0, at document #4092000/4922894\n", + "2019-01-31 01:26:33,704 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:33,971 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.014*\"norwai\" + 0.014*\"norwegian\" + 0.013*\"treeless\" + 0.013*\"damag\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:26:33,972 : INFO : topic #36 (0.020): 0.012*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 
0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"championship\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"user\"\n", + "2019-01-31 01:26:33,973 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:26:33,975 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.012*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 01:26:33,976 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:26:33,982 : INFO : topic diff=0.002838, rho=0.022108\n", + "2019-01-31 01:26:34,139 : INFO : PROGRESS: pass 0, at document #4094000/4922894\n", + "2019-01-31 01:26:35,513 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:35,780 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"blur\" + 0.012*\"pope\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"fleet\" + 0.009*\"bahá\"\n", + "2019-01-31 01:26:35,781 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"degre\" + 0.012*\"word\"\n", + "2019-01-31 01:26:35,782 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:26:35,784 : INFO : 
topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:26:35,785 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:26:35,790 : INFO : topic diff=0.003079, rho=0.022102\n", + "2019-01-31 01:26:36,004 : INFO : PROGRESS: pass 0, at document #4096000/4922894\n", + "2019-01-31 01:26:37,356 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:37,622 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:26:37,624 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.009*\"hormon\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:26:37,625 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"spectacl\" + 0.006*\"turn\"\n", + "2019-01-31 01:26:37,626 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"jame\" + 0.011*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:26:37,627 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.016*\"quarterli\" + 0.013*\"brazil\" + 0.013*\"kingdom\" + 0.013*\"order\"\n", + "2019-01-31 01:26:37,633 : INFO : 
topic diff=0.003419, rho=0.022097\n", + "2019-01-31 01:26:37,786 : INFO : PROGRESS: pass 0, at document #4098000/4922894\n", + "2019-01-31 01:26:39,124 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:39,390 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"vision\"\n", + "2019-01-31 01:26:39,391 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.029*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:26:39,393 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.022*\"kong\" + 0.020*\"korea\" + 0.016*\"leah\" + 0.016*\"korean\" + 0.015*\"sourc\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:26:39,394 : INFO : topic #26 (0.020): 0.031*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"medal\" + 0.022*\"men\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\" + 0.017*\"atheist\"\n", + "2019-01-31 01:26:39,395 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:26:39,401 : INFO : topic diff=0.003625, rho=0.022092\n", + "2019-01-31 01:26:42,073 : INFO : -11.457 per-word bound, 2810.3 perplexity estimate based on a held-out corpus of 2000 documents with 559757 words\n", + "2019-01-31 01:26:42,074 : INFO : PROGRESS: pass 0, at document #4100000/4922894\n", + "2019-01-31 01:26:43,444 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:43,711 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.035*\"new\" + 0.032*\"american\" + 
0.028*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.011*\"citi\"\n", + "2019-01-31 01:26:43,712 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.021*\"act\" + 0.019*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:26:43,713 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.005*\"method\"\n", + "2019-01-31 01:26:43,714 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"offic\" + 0.025*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.020*\"member\" + 0.017*\"serv\" + 0.016*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:26:43,715 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:26:43,721 : INFO : topic diff=0.003450, rho=0.022086\n", + "2019-01-31 01:26:43,877 : INFO : PROGRESS: pass 0, at document #4102000/4922894\n", + "2019-01-31 01:26:45,235 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:45,505 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:26:45,506 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:26:45,508 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" 
+ 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:26:45,509 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:26:45,510 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"develop\" + 0.006*\"spectacl\" + 0.006*\"turn\"\n", + "2019-01-31 01:26:45,516 : INFO : topic diff=0.003131, rho=0.022081\n", + "2019-01-31 01:26:45,671 : INFO : PROGRESS: pass 0, at document #4104000/4922894\n", + "2019-01-31 01:26:47,035 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:47,301 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"championship\" + 0.007*\"user\"\n", + "2019-01-31 01:26:47,303 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.045*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.016*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:26:47,304 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"hormon\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:26:47,305 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.024*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:26:47,306 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 
0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.015*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:26:47,312 : INFO : topic diff=0.003904, rho=0.022076\n", + "2019-01-31 01:26:47,472 : INFO : PROGRESS: pass 0, at document #4106000/4922894\n", + "2019-01-31 01:26:48,860 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:49,127 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:26:49,128 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.040*\"line\" + 0.032*\"raid\" + 0.027*\"rosenwald\" + 0.027*\"rivièr\" + 0.019*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:26:49,129 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.042*\"american\" + 0.032*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"folei\" + 0.017*\"english\" + 0.014*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:26:49,130 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:26:49,131 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:26:49,137 : INFO : topic diff=0.003090, rho=0.022070\n", + "2019-01-31 01:26:49,300 : INFO : PROGRESS: pass 0, at document #4108000/4922894\n", + "2019-01-31 01:26:50,693 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:50,959 : INFO : topic #12 
(0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.005*\"servitud\"\n", + "2019-01-31 01:26:50,961 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"start\" + 0.009*\"gothic\"\n", + "2019-01-31 01:26:50,962 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"wind\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.015*\"damag\" + 0.014*\"norwai\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:26:50,963 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:26:50,964 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:26:50,970 : INFO : topic diff=0.003497, rho=0.022065\n", + "2019-01-31 01:26:51,123 : INFO : PROGRESS: pass 0, at document #4110000/4922894\n", + "2019-01-31 01:26:52,462 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:52,728 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.024*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:26:52,729 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:26:52,731 : INFO : topic #44 (0.020): 
0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:26:52,732 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:26:52,733 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 01:26:52,738 : INFO : topic diff=0.003606, rho=0.022059\n", + "2019-01-31 01:26:52,893 : INFO : PROGRESS: pass 0, at document #4112000/4922894\n", + "2019-01-31 01:26:54,255 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:54,521 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:26:54,523 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:26:54,524 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"parish\" + 0.010*\"relationship\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:26:54,525 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"martin\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:26:54,526 : INFO : topic #16 (0.020): 0.056*\"king\" 
+ 0.031*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.016*\"rotterdam\" + 0.014*\"kingdom\" + 0.013*\"order\" + 0.013*\"brazil\"\n", + "2019-01-31 01:26:54,532 : INFO : topic diff=0.002802, rho=0.022054\n", + "2019-01-31 01:26:54,691 : INFO : PROGRESS: pass 0, at document #4114000/4922894\n", + "2019-01-31 01:26:56,077 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:56,344 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:26:56,345 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:26:56,346 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:26:56,347 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.037*\"sovereignti\" + 0.034*\"rural\" + 0.027*\"poison\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"malaysia\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:26:56,348 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.016*\"rotterdam\" + 0.014*\"kingdom\" + 0.013*\"order\" + 0.012*\"brazil\"\n", + "2019-01-31 01:26:56,354 : INFO : topic diff=0.003099, rho=0.022049\n", + "2019-01-31 01:26:56,510 : INFO : PROGRESS: pass 0, at document #4116000/4922894\n", + "2019-01-31 01:26:57,882 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:26:58,149 : INFO : 
topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:26:58,150 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:26:58,151 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"fool\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.011*\"horac\" + 0.010*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:26:58,152 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.042*\"american\" + 0.031*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"folei\" + 0.017*\"english\" + 0.014*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:26:58,153 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:26:58,159 : INFO : topic diff=0.003225, rho=0.022043\n", + "2019-01-31 01:26:58,314 : INFO : PROGRESS: pass 0, at document #4118000/4922894\n", + "2019-01-31 01:26:59,661 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:26:59,928 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"march\" + 0.077*\"octob\" + 0.070*\"august\" + 0.070*\"juli\" + 0.068*\"januari\" + 0.066*\"april\" + 0.066*\"notion\" + 0.065*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 01:26:59,929 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.019*\"ireland\" + 
0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:26:59,930 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:26:59,931 : INFO : topic #45 (0.020): 0.042*\"arsen\" + 0.029*\"jpg\" + 0.027*\"fifteenth\" + 0.027*\"museo\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.015*\"artist\" + 0.015*\"exhaust\" + 0.015*\"gai\" + 0.014*\"colder\"\n", + "2019-01-31 01:26:59,932 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.020*\"grammat\" + 0.018*\"duke\" + 0.017*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.016*\"rotterdam\" + 0.014*\"order\" + 0.014*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:26:59,938 : INFO : topic diff=0.003159, rho=0.022038\n", + "2019-01-31 01:27:02,676 : INFO : -11.624 per-word bound, 3155.6 perplexity estimate based on a held-out corpus of 2000 documents with 580547 words\n", + "2019-01-31 01:27:02,677 : INFO : PROGRESS: pass 0, at document #4120000/4922894\n", + "2019-01-31 01:27:04,067 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:04,334 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"incom\" + 0.007*\"trap\"\n", + "2019-01-31 01:27:04,335 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"start\" + 0.009*\"class\"\n", + "2019-01-31 01:27:04,336 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.021*\"ontario\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:27:04,337 : INFO : topic #1 
(0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.023*\"hong\" + 0.023*\"kong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:27:04,338 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 01:27:04,344 : INFO : topic diff=0.003187, rho=0.022033\n", + "2019-01-31 01:27:04,510 : INFO : PROGRESS: pass 0, at document #4122000/4922894\n", + "2019-01-31 01:27:05,887 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:06,153 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 01:27:06,154 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.020*\"act\" + 0.019*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:27:06,155 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"pour\" + 0.014*\"depress\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.006*\"spectacl\" + 0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:27:06,157 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.011*\"word\"\n", + "2019-01-31 01:27:06,157 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"damag\" + 0.016*\"wind\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.014*\"norwai\" + 0.013*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:27:06,163 : INFO : topic diff=0.003280, rho=0.022027\n", + "2019-01-31 
01:27:06,321 : INFO : PROGRESS: pass 0, at document #4124000/4922894\n", + "2019-01-31 01:27:07,722 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:07,989 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:27:07,990 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.072*\"best\" + 0.035*\"yawn\" + 0.026*\"jacksonvil\" + 0.022*\"noll\" + 0.021*\"japanes\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:27:07,991 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:27:07,992 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"servitud\"\n", + "2019-01-31 01:27:07,993 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"class\" + 0.009*\"start\"\n", + "2019-01-31 01:27:07,999 : INFO : topic diff=0.003621, rho=0.022022\n", + "2019-01-31 01:27:08,212 : INFO : PROGRESS: pass 0, at document #4126000/4922894\n", + "2019-01-31 01:27:09,571 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:09,838 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"wind\" + 0.016*\"damag\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.014*\"norwai\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.012*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:27:09,839 : INFO : topic #44 (0.020): 
0.031*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:27:09,840 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.006*\"develop\" + 0.006*\"spectacl\" + 0.006*\"turn\"\n", + "2019-01-31 01:27:09,841 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.010*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:27:09,842 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.006*\"citi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:27:09,849 : INFO : topic diff=0.003488, rho=0.022017\n", + "2019-01-31 01:27:10,003 : INFO : PROGRESS: pass 0, at document #4128000/4922894\n", + "2019-01-31 01:27:11,364 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:11,631 : INFO : topic #47 (0.020): 0.061*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:27:11,632 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.025*\"personifi\" + 0.023*\"reprint\" + 0.021*\"moscow\" + 0.019*\"poland\" + 0.015*\"unfortun\" + 0.015*\"malaysia\"\n", + "2019-01-31 01:27:11,633 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:27:11,634 : INFO : 
topic #14 (0.020): 0.024*\"forc\" + 0.021*\"walter\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:27:11,635 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.007*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:27:11,642 : INFO : topic diff=0.002884, rho=0.022011\n", + "2019-01-31 01:27:11,797 : INFO : PROGRESS: pass 0, at document #4130000/4922894\n", + "2019-01-31 01:27:13,163 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:27:13,429 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"parish\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:27:13,430 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"proclaim\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:27:13,431 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"lizard\"\n", + "2019-01-31 01:27:13,432 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:27:13,433 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"wind\" + 0.015*\"damag\" + 0.015*\"sweden\" + 0.014*\"swedish\" + 0.014*\"norwai\" + 0.013*\"norwegian\" + 
0.012*\"huntsvil\" + 0.012*\"treeless\" + 0.010*\"denmark\"\n", + "2019-01-31 01:27:13,439 : INFO : topic diff=0.002967, rho=0.022006\n", + "2019-01-31 01:27:13,593 : INFO : PROGRESS: pass 0, at document #4132000/4922894\n", + "2019-01-31 01:27:14,973 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:15,239 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:27:15,240 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"storag\"\n", + "2019-01-31 01:27:15,242 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:27:15,242 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:27:15,243 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:27:15,249 : INFO : topic diff=0.003301, rho=0.022001\n", + "2019-01-31 01:27:15,405 : INFO : PROGRESS: pass 0, at document #4134000/4922894\n", + "2019-01-31 01:27:16,800 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:17,066 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 
0.013*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 01:27:17,067 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.039*\"line\" + 0.031*\"raid\" + 0.028*\"rivièr\" + 0.027*\"rosenwald\" + 0.019*\"serv\" + 0.018*\"airmen\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:27:17,069 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:27:17,070 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 01:27:17,070 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.046*\"chilton\" + 0.025*\"kong\" + 0.024*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:27:17,076 : INFO : topic diff=0.002866, rho=0.021995\n", + "2019-01-31 01:27:17,241 : INFO : PROGRESS: pass 0, at document #4136000/4922894\n", + "2019-01-31 01:27:18,643 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:18,912 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.013*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"storag\"\n", + "2019-01-31 01:27:18,913 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.016*\"rotterdam\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"order\" + 0.013*\"maria\"\n", + "2019-01-31 01:27:18,914 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.015*\"new\" + 0.015*\"misericordia\" + 
0.015*\"hydrogen\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:27:18,915 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:27:18,916 : INFO : topic #45 (0.020): 0.043*\"arsen\" + 0.028*\"jpg\" + 0.027*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:27:18,922 : INFO : topic diff=0.003440, rho=0.021990\n", + "2019-01-31 01:27:19,085 : INFO : PROGRESS: pass 0, at document #4138000/4922894\n", + "2019-01-31 01:27:20,452 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:20,722 : INFO : topic #45 (0.020): 0.043*\"arsen\" + 0.029*\"jpg\" + 0.027*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.014*\"colder\"\n", + "2019-01-31 01:27:20,723 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:27:20,724 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.012*\"degre\"\n", + "2019-01-31 01:27:20,725 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.011*\"deal\"\n", + "2019-01-31 01:27:20,726 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 
0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 01:27:20,732 : INFO : topic diff=0.003346, rho=0.021985\n", + "2019-01-31 01:27:23,382 : INFO : -11.737 per-word bound, 3412.4 perplexity estimate based on a held-out corpus of 2000 documents with 518973 words\n", + "2019-01-31 01:27:23,382 : INFO : PROGRESS: pass 0, at document #4140000/4922894\n", + "2019-01-31 01:27:24,751 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:25,020 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.019*\"taxpay\" + 0.018*\"nation\" + 0.017*\"atheist\"\n", + "2019-01-31 01:27:25,021 : INFO : topic #9 (0.020): 0.068*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"polit\" + 0.017*\"folei\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:27:25,022 : INFO : topic #0 (0.020): 0.065*\"statewid\" + 0.039*\"line\" + 0.031*\"raid\" + 0.028*\"rivièr\" + 0.027*\"rosenwald\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.018*\"airmen\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:27:25,023 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"seaport\"\n", + "2019-01-31 01:27:25,024 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.020*\"grammat\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.016*\"quarterli\" + 0.016*\"rotterdam\" + 0.014*\"kingdom\" + 0.013*\"order\" + 0.013*\"maria\"\n", + "2019-01-31 01:27:25,030 : INFO : topic diff=0.002973, rho=0.021979\n", + "2019-01-31 01:27:25,189 : INFO : PROGRESS: pass 0, at document #4142000/4922894\n", + "2019-01-31 01:27:26,554 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": 
"stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:27:26,820 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"walter\" + 0.021*\"armi\" + 0.019*\"com\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:27:26,822 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.011*\"anim\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:27:26,823 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.020*\"act\" + 0.019*\"start\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:27:26,824 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"incom\" + 0.007*\"trap\"\n", + "2019-01-31 01:27:26,824 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"hydrogen\" + 0.014*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 01:27:26,830 : INFO : topic diff=0.003530, rho=0.021974\n", + "2019-01-31 01:27:26,986 : INFO : PROGRESS: pass 0, at document #4144000/4922894\n", + "2019-01-31 01:27:28,370 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:28,636 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:27:28,637 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"wind\" + 0.015*\"damag\" + 0.015*\"sweden\" + 0.014*\"norwai\" + 0.014*\"swedish\" + 0.013*\"norwegian\" + 0.011*\"huntsvil\" + 
0.011*\"treeless\" + 0.010*\"denmark\"\n", + "2019-01-31 01:27:28,639 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"daughter\"\n", + "2019-01-31 01:27:28,640 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.011*\"anim\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:27:28,641 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.014*\"der\" + 0.013*\"israel\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:27:28,647 : INFO : topic diff=0.003527, rho=0.021969\n", + "2019-01-31 01:27:28,804 : INFO : PROGRESS: pass 0, at document #4146000/4922894\n", + "2019-01-31 01:27:30,173 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:30,439 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.011*\"horac\" + 0.010*\"find\" + 0.010*\"squatter\"\n", + "2019-01-31 01:27:30,440 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:27:30,441 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.010*\"alam\"\n", + "2019-01-31 01:27:30,442 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 
0.009*\"area\"\n", + "2019-01-31 01:27:30,443 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"palmer\"\n", + "2019-01-31 01:27:30,449 : INFO : topic diff=0.003766, rho=0.021963\n", + "2019-01-31 01:27:30,609 : INFO : PROGRESS: pass 0, at document #4148000/4922894\n", + "2019-01-31 01:27:32,006 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:32,272 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:27:32,273 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.011*\"anim\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.006*\"vision\"\n", + "2019-01-31 01:27:32,274 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"http\" + 0.012*\"word\" + 0.012*\"degre\"\n", + "2019-01-31 01:27:32,275 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.008*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:27:32,276 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.007*\"rhyme\" + 0.007*\"georg\" + 0.007*\"paul\"\n", + "2019-01-31 01:27:32,282 : INFO : topic diff=0.003889, rho=0.021958\n", + "2019-01-31 01:27:32,447 : INFO : PROGRESS: pass 0, at document #4150000/4922894\n", + "2019-01-31 01:27:33,828 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:27:34,098 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:27:34,099 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.045*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.021*\"ontario\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"misericordia\" + 0.014*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 01:27:34,101 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:27:34,102 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"area\"\n", + "2019-01-31 01:27:34,102 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.024*\"multitud\" + 0.021*\"area\" + 0.021*\"adulthood\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:27:34,108 : INFO : topic diff=0.003091, rho=0.021953\n", + "2019-01-31 01:27:34,266 : INFO : PROGRESS: pass 0, at document #4152000/4922894\n", + "2019-01-31 01:27:35,657 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:35,924 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:27:35,925 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.039*\"line\" + 0.031*\"raid\" + 0.027*\"rivièr\" + 0.026*\"rosenwald\" + 0.023*\"airmen\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.013*\"oper\" + 
0.010*\"transient\"\n", + "2019-01-31 01:27:35,926 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.071*\"best\" + 0.034*\"yawn\" + 0.027*\"jacksonvil\" + 0.023*\"noll\" + 0.022*\"japanes\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:27:35,927 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.079*\"march\" + 0.078*\"octob\" + 0.071*\"juli\" + 0.071*\"august\" + 0.071*\"januari\" + 0.068*\"notion\" + 0.067*\"april\" + 0.066*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:27:35,928 : INFO : topic #24 (0.020): 0.039*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.019*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:27:35,934 : INFO : topic diff=0.003224, rho=0.021948\n", + "2019-01-31 01:27:36,095 : INFO : PROGRESS: pass 0, at document #4154000/4922894\n", + "2019-01-31 01:27:37,492 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:37,759 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"proclaim\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:27:37,760 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"televis\" + 0.012*\"pakistan\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.010*\"sri\"\n", + "2019-01-31 01:27:37,761 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.014*\"martin\" + 0.013*\"open\"\n", + "2019-01-31 01:27:37,762 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 
0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"palmer\"\n", + "2019-01-31 01:27:37,763 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.019*\"taxpay\" + 0.018*\"nation\" + 0.017*\"atheist\"\n", + "2019-01-31 01:27:37,769 : INFO : topic diff=0.003359, rho=0.021942\n", + "2019-01-31 01:27:37,926 : INFO : PROGRESS: pass 0, at document #4156000/4922894\n", + "2019-01-31 01:27:39,312 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:39,578 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.029*\"valour\" + 0.020*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:27:39,579 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:27:39,580 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:27:39,582 : INFO : topic #0 (0.020): 0.064*\"statewid\" + 0.040*\"line\" + 0.031*\"raid\" + 0.027*\"rivièr\" + 0.026*\"rosenwald\" + 0.023*\"airmen\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:27:39,583 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.011*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.008*\"championship\" + 0.007*\"user\"\n", + "2019-01-31 01:27:39,588 : INFO : topic diff=0.002757, rho=0.021937\n", + "2019-01-31 01:27:39,800 : INFO : PROGRESS: pass 0, at document 
#4158000/4922894\n", + "2019-01-31 01:27:41,147 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:41,414 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:27:41,415 : INFO : topic #45 (0.020): 0.043*\"arsen\" + 0.029*\"jpg\" + 0.027*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:27:41,417 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"local\"\n", + "2019-01-31 01:27:41,418 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"shirin\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 01:27:41,419 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"ret\" + 0.011*\"find\" + 0.011*\"horac\" + 0.010*\"squatter\"\n", + "2019-01-31 01:27:41,426 : INFO : topic diff=0.003258, rho=0.021932\n", + "2019-01-31 01:27:44,081 : INFO : -11.643 per-word bound, 3198.3 perplexity estimate based on a held-out corpus of 2000 documents with 541281 words\n", + "2019-01-31 01:27:44,082 : INFO : PROGRESS: pass 0, at document #4160000/4922894\n", + "2019-01-31 01:27:45,451 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:45,718 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.015*\"gener\" + 
0.014*\"seri\"\n", + "2019-01-31 01:27:45,719 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"lobe\"\n", + "2019-01-31 01:27:45,720 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:27:45,721 : INFO : topic #45 (0.020): 0.043*\"arsen\" + 0.029*\"jpg\" + 0.027*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.016*\"exhaust\" + 0.016*\"artist\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:27:45,722 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"field\"\n", + "2019-01-31 01:27:45,728 : INFO : topic diff=0.003244, rho=0.021926\n", + "2019-01-31 01:27:45,884 : INFO : PROGRESS: pass 0, at document #4162000/4922894\n", + "2019-01-31 01:27:47,264 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:47,534 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:27:47,535 : INFO : topic #47 (0.020): 0.062*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:27:47,536 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.013*\"toyota\" + 0.013*\"charcoal\" + 
0.010*\"myspac\"\n", + "2019-01-31 01:27:47,537 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.009*\"relationship\" + 0.009*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:27:47,538 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.015*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:27:47,544 : INFO : topic diff=0.003101, rho=0.021921\n", + "2019-01-31 01:27:47,700 : INFO : PROGRESS: pass 0, at document #4164000/4922894\n", + "2019-01-31 01:27:49,057 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:49,324 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.015*\"shirin\" + 0.015*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 01:27:49,325 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:27:49,326 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.013*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.006*\"trap\" + 0.006*\"incom\"\n", + "2019-01-31 01:27:49,327 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"class\" + 0.009*\"gothic\" + 0.009*\"district\"\n", + "2019-01-31 01:27:49,328 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 
0.009*\"bahá\"\n", + "2019-01-31 01:27:49,334 : INFO : topic diff=0.003037, rho=0.021916\n", + "2019-01-31 01:27:49,492 : INFO : PROGRESS: pass 0, at document #4166000/4922894\n", + "2019-01-31 01:27:50,877 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:51,143 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.015*\"norwai\" + 0.015*\"sweden\" + 0.014*\"wind\" + 0.014*\"damag\" + 0.014*\"swedish\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.012*\"huntsvil\" + 0.010*\"denmark\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:27:51,144 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:27:51,145 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.014*\"ret\" + 0.012*\"driver\" + 0.012*\"horac\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"squatter\"\n", + "2019-01-31 01:27:51,147 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:27:51,147 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:27:51,153 : INFO : topic diff=0.003395, rho=0.021911\n", + "2019-01-31 01:27:51,308 : INFO : PROGRESS: pass 0, at document #4168000/4922894\n", + "2019-01-31 01:27:52,676 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:52,942 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 
0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:27:52,943 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.016*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:27:52,944 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.020*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.017*\"english\" + 0.014*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:27:52,946 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"championship\"\n", + "2019-01-31 01:27:52,947 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:27:52,953 : INFO : topic diff=0.003222, rho=0.021905\n", + "2019-01-31 01:27:53,110 : INFO : PROGRESS: pass 0, at document #4170000/4922894\n", + "2019-01-31 01:27:54,521 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:54,788 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"cathedr\" + 0.009*\"historiographi\"\n", + "2019-01-31 01:27:54,789 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.017*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:27:54,790 : INFO : topic #27 (0.020): 0.073*\"questionnair\" + 0.021*\"candid\" + 
0.018*\"taxpay\" + 0.014*\"tornado\" + 0.014*\"ret\" + 0.012*\"driver\" + 0.012*\"horac\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"squatter\"\n", + "2019-01-31 01:27:54,791 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:27:54,793 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"vacant\"\n", + "2019-01-31 01:27:54,798 : INFO : topic diff=0.003274, rho=0.021900\n", + "2019-01-31 01:27:54,952 : INFO : PROGRESS: pass 0, at document #4172000/4922894\n", + "2019-01-31 01:27:56,313 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:56,580 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"championship\" + 0.007*\"includ\"\n", + "2019-01-31 01:27:56,581 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.016*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:27:56,582 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.032*\"priest\" + 0.019*\"grammat\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"order\" + 0.013*\"portugues\"\n", + "2019-01-31 01:27:56,583 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.011*\"citi\"\n", + "2019-01-31 01:27:56,584 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" 
+ 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"field\"\n", + "2019-01-31 01:27:56,590 : INFO : topic diff=0.002931, rho=0.021895\n", + "2019-01-31 01:27:56,750 : INFO : PROGRESS: pass 0, at document #4174000/4922894\n", + "2019-01-31 01:27:58,138 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:27:58,408 : INFO : topic #21 (0.020): 0.033*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.018*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:27:58,409 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:27:58,410 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:27:58,411 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.013*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"florida\" + 0.007*\"incom\"\n", + "2019-01-31 01:27:58,412 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.036*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:27:58,418 : INFO : topic diff=0.002811, rho=0.021890\n", + "2019-01-31 01:27:58,574 : INFO : PROGRESS: pass 0, at document #4176000/4922894\n", + "2019-01-31 01:27:59,946 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:00,213 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 
0.043*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:28:00,214 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:28:00,215 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.027*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:28:00,216 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.078*\"octob\" + 0.078*\"march\" + 0.071*\"juli\" + 0.071*\"august\" + 0.070*\"januari\" + 0.067*\"notion\" + 0.066*\"judici\" + 0.066*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:28:00,217 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.041*\"line\" + 0.031*\"raid\" + 0.028*\"rivièr\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.019*\"serv\" + 0.019*\"traceabl\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:28:00,223 : INFO : topic diff=0.003335, rho=0.021884\n", + "2019-01-31 01:28:00,385 : INFO : PROGRESS: pass 0, at document #4178000/4922894\n", + "2019-01-31 01:28:01,813 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:02,079 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"wander\"\n", + "2019-01-31 01:28:02,081 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"workplac\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:28:02,082 : INFO : topic #27 (0.020): 
0.073*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"ret\" + 0.012*\"horac\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:28:02,083 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.024*\"wife\" + 0.022*\"tourist\" + 0.020*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"open\"\n", + "2019-01-31 01:28:02,084 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:28:02,090 : INFO : topic diff=0.002943, rho=0.021879\n", + "2019-01-31 01:28:04,807 : INFO : -11.514 per-word bound, 2925.5 perplexity estimate based on a held-out corpus of 2000 documents with 561329 words\n", + "2019-01-31 01:28:04,808 : INFO : PROGRESS: pass 0, at document #4180000/4922894\n", + "2019-01-31 01:28:06,186 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:06,453 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.013*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:28:06,454 : INFO : topic #43 (0.020): 0.068*\"elect\" + 0.053*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.015*\"conserv\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:28:06,455 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"carlo\"\n", + "2019-01-31 01:28:06,456 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 
0.010*\"industri\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:28:06,457 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:28:06,462 : INFO : topic diff=0.002960, rho=0.021874\n", + "2019-01-31 01:28:06,617 : INFO : PROGRESS: pass 0, at document #4182000/4922894\n", + "2019-01-31 01:28:07,956 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:08,223 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:08,224 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:28:08,225 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:28:08,226 : INFO : topic #39 (0.020): 0.062*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.024*\"toronto\" + 0.020*\"ontario\" + 0.015*\"quebec\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"hydrogen\" + 0.013*\"novotná\"\n", + "2019-01-31 01:28:08,227 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"field\" + 0.006*\"servitud\"\n", + "2019-01-31 01:28:08,233 : INFO : topic diff=0.003073, rho=0.021869\n", + "2019-01-31 01:28:08,391 : INFO : PROGRESS: pass 0, at document #4184000/4922894\n", + "2019-01-31 
01:28:09,769 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:10,036 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.028*\"final\" + 0.023*\"wife\" + 0.022*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"taxpay\" + 0.013*\"open\"\n", + "2019-01-31 01:28:10,037 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.010*\"affection\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:28:10,038 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.036*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.016*\"malaysia\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:28:10,039 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:28:10,040 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:28:10,046 : INFO : topic diff=0.003508, rho=0.021863\n", + "2019-01-31 01:28:10,205 : INFO : PROGRESS: pass 0, at document #4186000/4922894\n", + "2019-01-31 01:28:11,590 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:11,857 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"collector\" + 0.021*\"institut\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:28:11,858 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.046*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 
0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:28:11,860 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.011*\"citi\"\n", + "2019-01-31 01:28:11,861 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.041*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"gothic\" + 0.009*\"district\" + 0.009*\"task\"\n", + "2019-01-31 01:28:11,862 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.006*\"trap\" + 0.006*\"florida\"\n", + "2019-01-31 01:28:11,868 : INFO : topic diff=0.003025, rho=0.021858\n", + "2019-01-31 01:28:12,029 : INFO : PROGRESS: pass 0, at document #4188000/4922894\n", + "2019-01-31 01:28:13,914 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:14,180 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"ret\" + 0.012*\"horac\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"théori\"\n", + "2019-01-31 01:28:14,181 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.026*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.015*\"shirin\" + 0.015*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 01:28:14,182 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:28:14,183 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 
0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:28:14,184 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:28:14,190 : INFO : topic diff=0.003308, rho=0.021853\n", + "2019-01-31 01:28:14,346 : INFO : PROGRESS: pass 0, at document #4190000/4922894\n", + "2019-01-31 01:28:15,753 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:16,021 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.040*\"line\" + 0.031*\"raid\" + 0.029*\"rivièr\" + 0.027*\"rosenwald\" + 0.022*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:28:16,022 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.038*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.016*\"malaysia\" + 0.015*\"unfortun\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:28:16,023 : INFO : topic #43 (0.020): 0.069*\"elect\" + 0.053*\"parti\" + 0.024*\"democrat\" + 0.024*\"voluntari\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"conserv\" + 0.014*\"selma\" + 0.014*\"bypass\"\n", + "2019-01-31 01:28:16,024 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:28:16,025 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.007*\"mode\" + 0.006*\"develop\" + 0.006*\"spectacl\" + 0.006*\"turn\"\n", + "2019-01-31 01:28:16,031 : INFO : topic diff=0.002794, 
rho=0.021848\n", + "2019-01-31 01:28:16,242 : INFO : PROGRESS: pass 0, at document #4192000/4922894\n", + "2019-01-31 01:28:17,599 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:17,865 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:28:17,867 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"proclaim\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:17,868 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 01:28:17,869 : INFO : topic #48 (0.020): 0.080*\"sens\" + 0.080*\"march\" + 0.078*\"octob\" + 0.072*\"juli\" + 0.072*\"januari\" + 0.071*\"august\" + 0.068*\"notion\" + 0.068*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:28:17,870 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"citi\"\n", + "2019-01-31 01:28:17,876 : INFO : topic diff=0.003122, rho=0.021843\n", + "2019-01-31 01:28:18,039 : INFO : PROGRESS: pass 0, at document #4194000/4922894\n", + "2019-01-31 01:28:19,446 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:19,713 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"citi\"\n", + "2019-01-31 01:28:19,714 : INFO : topic #7 
(0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"daughter\"\n", + "2019-01-31 01:28:19,715 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:28:19,716 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:28:19,717 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:28:19,723 : INFO : topic diff=0.003516, rho=0.021837\n", + "2019-01-31 01:28:19,875 : INFO : PROGRESS: pass 0, at document #4196000/4922894\n", + "2019-01-31 01:28:21,220 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:21,487 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:28:21,488 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.037*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"personifi\" + 0.024*\"reprint\" + 0.024*\"poison\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.016*\"malaysia\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:28:21,489 : INFO : topic #43 (0.020): 0.068*\"elect\" + 0.055*\"parti\" + 0.025*\"democrat\" + 0.024*\"voluntari\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.013*\"conserv\" + 0.013*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:28:21,490 : INFO : topic #36 
(0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.010*\"prognosi\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.008*\"championship\" + 0.007*\"includ\"\n", + "2019-01-31 01:28:21,490 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:28:21,496 : INFO : topic diff=0.003670, rho=0.021832\n", + "2019-01-31 01:28:21,656 : INFO : PROGRESS: pass 0, at document #4198000/4922894\n", + "2019-01-31 01:28:23,044 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:23,310 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:28:23,312 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.011*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.006*\"black\"\n", + "2019-01-31 01:28:23,313 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:28:23,314 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.025*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:28:23,315 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.022*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:28:23,321 : INFO : 
topic diff=0.004351, rho=0.021827\n", + "2019-01-31 01:28:25,977 : INFO : -11.615 per-word bound, 3137.4 perplexity estimate based on a held-out corpus of 2000 documents with 531616 words\n", + "2019-01-31 01:28:25,978 : INFO : PROGRESS: pass 0, at document #4200000/4922894\n", + "2019-01-31 01:28:27,354 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:27,621 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.014*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:28:27,622 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.046*\"canadian\" + 0.024*\"hoar\" + 0.024*\"toronto\" + 0.020*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:28:27,623 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.034*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:28:27,624 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:28:27,625 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.025*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:28:27,631 : INFO : topic diff=0.002872, rho=0.021822\n", + "2019-01-31 01:28:27,788 : INFO : PROGRESS: pass 0, at document #4202000/4922894\n", + "2019-01-31 01:28:29,166 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:29,432 : INFO : topic #19 (0.020): 0.016*\"languag\" + 
0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:28:29,433 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.014*\"acrimoni\" + 0.013*\"simpler\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:28:29,434 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.045*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.015*\"shirin\" + 0.015*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 01:28:29,435 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"spectacl\" + 0.006*\"produc\"\n", + "2019-01-31 01:28:29,436 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:28:29,442 : INFO : topic diff=0.003367, rho=0.021817\n", + "2019-01-31 01:28:29,602 : INFO : PROGRESS: pass 0, at document #4204000/4922894\n", + "2019-01-31 01:28:30,999 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:31,265 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:28:31,266 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 
01:28:31,267 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.016*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"lobe\"\n", + "2019-01-31 01:28:31,268 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"parish\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:28:31,269 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.011*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:28:31,275 : INFO : topic diff=0.003307, rho=0.021811\n", + "2019-01-31 01:28:31,434 : INFO : PROGRESS: pass 0, at document #4206000/4922894\n", + "2019-01-31 01:28:32,795 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:33,063 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:28:33,064 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"storag\"\n", + "2019-01-31 01:28:33,065 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"jame\" + 0.011*\"david\" + 0.011*\"will\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:28:33,066 : INFO : topic #48 (0.020): 0.080*\"sens\" + 0.080*\"march\" + 0.080*\"octob\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"august\" + 0.069*\"notion\" + 0.069*\"judici\" + 0.068*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 
01:28:33,067 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"proclaim\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:33,073 : INFO : topic diff=0.003209, rho=0.021806\n", + "2019-01-31 01:28:33,236 : INFO : PROGRESS: pass 0, at document #4208000/4922894\n", + "2019-01-31 01:28:34,661 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:34,928 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"proclaim\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:34,929 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.019*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.006*\"trap\" + 0.006*\"incom\"\n", + "2019-01-31 01:28:34,929 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:28:34,930 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"pop\" + 0.011*\"prognosi\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"championship\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"softwar\" + 0.007*\"includ\"\n", + "2019-01-31 01:28:34,931 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"pistol\" + 0.011*\"silicon\" + 0.010*\"centuri\"\n", + "2019-01-31 01:28:34,937 : INFO : topic diff=0.004575, rho=0.021801\n", + "2019-01-31 01:28:35,097 : INFO : PROGRESS: pass 0, at document #4210000/4922894\n", + "2019-01-31 01:28:36,481 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 01:28:36,748 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"proclaim\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:36,749 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.011*\"will\"\n", + "2019-01-31 01:28:36,750 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:28:36,751 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.027*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:28:36,752 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:28:36,758 : INFO : topic diff=0.002869, rho=0.021796\n", + "2019-01-31 01:28:36,917 : INFO : PROGRESS: pass 0, at document #4212000/4922894\n", + "2019-01-31 01:28:38,296 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:38,563 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:28:38,564 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.006*\"théori\" 
+ 0.006*\"field\"\n", + "2019-01-31 01:28:38,565 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:28:38,566 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.027*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:28:38,567 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.045*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.021*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.015*\"hydrogen\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:28:38,573 : INFO : topic diff=0.003219, rho=0.021791\n", + "2019-01-31 01:28:38,729 : INFO : PROGRESS: pass 0, at document #4214000/4922894\n", + "2019-01-31 01:28:40,105 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:40,371 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.034*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.013*\"terri\" + 0.011*\"citi\"\n", + "2019-01-31 01:28:40,372 : INFO : topic #43 (0.020): 0.068*\"elect\" + 0.056*\"parti\" + 0.025*\"democrat\" + 0.023*\"voluntari\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.013*\"bypass\" + 0.013*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:28:40,373 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.011*\"anim\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.006*\"black\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:28:40,374 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" 
+ 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:28:40,375 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:28:40,381 : INFO : topic diff=0.003139, rho=0.021786\n", + "2019-01-31 01:28:40,538 : INFO : PROGRESS: pass 0, at document #4216000/4922894\n", + "2019-01-31 01:28:41,918 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:42,185 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"australian\" + 0.023*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:28:42,186 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:28:42,187 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.046*\"chilton\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:28:42,188 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"field\"\n", + "2019-01-31 01:28:42,190 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.021*\"champion\" + 0.015*\"martin\" + 0.015*\"open\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\"\n", + "2019-01-31 01:28:42,195 : INFO : topic diff=0.003594, rho=0.021780\n", + "2019-01-31 01:28:42,358 : INFO : PROGRESS: pass 0, at document 
#4218000/4922894\n", + "2019-01-31 01:28:43,770 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:44,036 : INFO : topic #13 (0.020): 0.028*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.024*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:28:44,038 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:28:44,039 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"field\"\n", + "2019-01-31 01:28:44,040 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.041*\"line\" + 0.032*\"raid\" + 0.028*\"rivièr\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.019*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:28:44,041 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.011*\"pistol\" + 0.011*\"silicon\" + 0.010*\"centuri\"\n", + "2019-01-31 01:28:44,047 : INFO : topic diff=0.003487, rho=0.021775\n", + "2019-01-31 01:28:46,784 : INFO : -11.678 per-word bound, 3277.5 perplexity estimate based on a held-out corpus of 2000 documents with 580486 words\n", + "2019-01-31 01:28:46,784 : INFO : PROGRESS: pass 0, at document #4220000/4922894\n", + "2019-01-31 01:28:48,190 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:48,457 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 
0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:28:48,458 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.015*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:28:48,459 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.012*\"anglo\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:28:48,460 : INFO : topic #25 (0.020): 0.035*\"ring\" + 0.018*\"lagrang\" + 0.018*\"area\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"lobe\"\n", + "2019-01-31 01:28:48,461 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.009*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"incom\" + 0.006*\"trap\"\n", + "2019-01-31 01:28:48,467 : INFO : topic diff=0.003706, rho=0.021770\n", + "2019-01-31 01:28:48,685 : INFO : PROGRESS: pass 0, at document #4222000/4922894\n", + "2019-01-31 01:28:50,076 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:50,342 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:50,343 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:28:50,344 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.045*\"canadian\" + 0.024*\"hoar\" + 0.023*\"toronto\" + 0.020*\"ontario\" + 0.015*\"new\" + 0.015*\"misericordia\" + 
0.015*\"hydrogen\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:28:50,345 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.015*\"open\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\"\n", + "2019-01-31 01:28:50,346 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:28:50,352 : INFO : topic diff=0.003464, rho=0.021765\n", + "2019-01-31 01:28:50,508 : INFO : PROGRESS: pass 0, at document #4224000/4922894\n", + "2019-01-31 01:28:51,889 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:52,155 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:28:52,156 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.008*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:28:52,157 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.013*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:28:52,158 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:28:52,159 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.079*\"sens\" + 0.079*\"octob\" + 0.073*\"juli\" + 0.072*\"januari\" + 0.071*\"august\" + 0.070*\"judici\" + 
0.070*\"notion\" + 0.068*\"april\" + 0.066*\"decatur\"\n", + "2019-01-31 01:28:52,165 : INFO : topic diff=0.002320, rho=0.021760\n", + "2019-01-31 01:28:52,325 : INFO : PROGRESS: pass 0, at document #4226000/4922894\n", + "2019-01-31 01:28:53,716 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:53,986 : INFO : topic #45 (0.020): 0.044*\"arsen\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.027*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.015*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:28:53,987 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:28:53,989 : INFO : topic #41 (0.020): 0.040*\"citi\" + 0.023*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"hot\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:28:53,990 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.021*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:28:53,991 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.006*\"incom\" + 0.006*\"trap\"\n", + "2019-01-31 01:28:53,997 : INFO : topic diff=0.003006, rho=0.021755\n", + "2019-01-31 01:28:54,153 : INFO : PROGRESS: pass 0, at document #4228000/4922894\n", + "2019-01-31 01:28:55,528 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:55,795 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" 
+ 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:28:55,796 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:28:55,797 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"teufel\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"citi\"\n", + "2019-01-31 01:28:55,798 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.055*\"parti\" + 0.026*\"democrat\" + 0.024*\"voluntari\" + 0.018*\"member\" + 0.017*\"republ\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:28:55,799 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"turn\"\n", + "2019-01-31 01:28:55,805 : INFO : topic diff=0.002645, rho=0.021749\n", + "2019-01-31 01:28:55,965 : INFO : PROGRESS: pass 0, at document #4230000/4922894\n", + "2019-01-31 01:28:57,360 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:57,626 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:28:57,628 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.015*\"sweden\" + 0.014*\"wind\" + 0.014*\"norwai\" + 0.014*\"damag\" + 0.014*\"swedish\" + 0.012*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:28:57,629 : INFO : topic #45 (0.020): 0.044*\"arsen\" + 0.030*\"jpg\" + 0.028*\"museo\" + 0.027*\"fifteenth\" + 
0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:28:57,630 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:28:57,631 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"uruguayan\" + 0.008*\"championship\" + 0.008*\"softwar\" + 0.008*\"user\"\n", + "2019-01-31 01:28:57,636 : INFO : topic diff=0.003075, rho=0.021744\n", + "2019-01-31 01:28:57,792 : INFO : PROGRESS: pass 0, at document #4232000/4922894\n", + "2019-01-31 01:28:59,168 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:28:59,434 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.011*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:28:59,435 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:28:59,436 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.011*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.006*\"black\"\n", + "2019-01-31 01:28:59,437 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.015*\"sweden\" + 0.015*\"damag\" + 0.015*\"norwai\" + 0.014*\"wind\" + 0.013*\"swedish\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:28:59,438 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 
0.023*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:28:59,444 : INFO : topic diff=0.003145, rho=0.021739\n", + "2019-01-31 01:28:59,607 : INFO : PROGRESS: pass 0, at document #4234000/4922894\n", + "2019-01-31 01:29:01,024 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:01,290 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.010*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:29:01,291 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:29:01,292 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.042*\"line\" + 0.032*\"raid\" + 0.028*\"rivièr\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:29:01,293 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.025*\"cathol\" + 0.021*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.010*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:29:01,294 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"trap\" + 0.006*\"incom\"\n", + "2019-01-31 01:29:01,300 : INFO : topic diff=0.004785, rho=0.021734\n", + "2019-01-31 01:29:01,463 : INFO : PROGRESS: pass 0, at document #4236000/4922894\n", + "2019-01-31 01:29:02,861 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:03,131 : INFO : topic #14 (0.020): 0.024*\"forc\" + 
0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:29:03,132 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"horac\" + 0.010*\"théori\"\n", + "2019-01-31 01:29:03,133 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.011*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:29:03,134 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.019*\"grammat\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"rotterdam\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"order\"\n", + "2019-01-31 01:29:03,135 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:29:03,141 : INFO : topic diff=0.003840, rho=0.021729\n", + "2019-01-31 01:29:03,298 : INFO : PROGRESS: pass 0, at document #4238000/4922894\n", + "2019-01-31 01:29:04,686 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:04,953 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.011*\"coalit\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 01:29:04,954 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:29:04,955 : INFO : topic #26 (0.020): 0.030*\"workplac\" 
+ 0.027*\"champion\" + 0.025*\"olymp\" + 0.025*\"woman\" + 0.023*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\" + 0.017*\"atheist\"\n", + "2019-01-31 01:29:04,956 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.042*\"line\" + 0.032*\"raid\" + 0.028*\"rivièr\" + 0.026*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:29:04,957 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.019*\"lagrang\" + 0.018*\"area\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.009*\"north\" + 0.009*\"foam\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"vacant\"\n", + "2019-01-31 01:29:04,963 : INFO : topic diff=0.002986, rho=0.021724\n", + "2019-01-31 01:29:07,674 : INFO : -11.666 per-word bound, 3249.1 perplexity estimate based on a held-out corpus of 2000 documents with 541190 words\n", + "2019-01-31 01:29:07,674 : INFO : PROGRESS: pass 0, at document #4240000/4922894\n", + "2019-01-31 01:29:09,057 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:09,326 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.043*\"american\" + 0.028*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:29:09,327 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:29:09,328 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"turn\"\n", + "2019-01-31 01:29:09,329 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 
0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.006*\"empath\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:29:09,330 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.034*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"citi\"\n", + "2019-01-31 01:29:09,336 : INFO : topic diff=0.002820, rho=0.021719\n", + "2019-01-31 01:29:09,494 : INFO : PROGRESS: pass 0, at document #4242000/4922894\n", + "2019-01-31 01:29:10,882 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:11,149 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:29:11,150 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.028*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:29:11,151 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.007*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"turn\"\n", + "2019-01-31 01:29:11,152 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.042*\"line\" + 0.032*\"raid\" + 0.028*\"rivièr\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:29:11,153 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.019*\"grammat\" + 0.018*\"idiosyncrat\" + 0.018*\"duke\" + 0.017*\"rotterdam\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 01:29:11,159 : INFO : topic diff=0.003042, rho=0.021713\n", + "2019-01-31 
01:29:11,311 : INFO : PROGRESS: pass 0, at document #4244000/4922894\n", + "2019-01-31 01:29:12,653 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:12,920 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:29:12,921 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:29:12,922 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:29:12,923 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.048*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.013*\"kim\"\n", + "2019-01-31 01:29:12,924 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:29:12,931 : INFO : topic diff=0.003416, rho=0.021708\n", + "2019-01-31 01:29:13,084 : INFO : PROGRESS: pass 0, at document #4246000/4922894\n", + "2019-01-31 01:29:14,443 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:14,709 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:29:14,710 : INFO : topic #19 (0.020): 0.017*\"languag\" + 
0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:29:14,711 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:29:14,712 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.010*\"sri\" + 0.010*\"muskoge\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:29:14,713 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.025*\"democrat\" + 0.025*\"voluntari\" + 0.018*\"member\" + 0.016*\"republ\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:29:14,719 : INFO : topic diff=0.003352, rho=0.021703\n", + "2019-01-31 01:29:14,877 : INFO : PROGRESS: pass 0, at document #4248000/4922894\n", + "2019-01-31 01:29:16,277 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:16,543 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.018*\"idiosyncrat\" + 0.017*\"rotterdam\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 01:29:16,544 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:29:16,545 : INFO : topic #37 (0.020): 0.013*\"anim\" + 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:29:16,546 : INFO : topic #45 (0.020): 0.045*\"arsen\" 
+ 0.030*\"jpg\" + 0.028*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.016*\"colder\"\n", + "2019-01-31 01:29:16,548 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"jame\" + 0.011*\"will\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:29:16,553 : INFO : topic diff=0.003377, rho=0.021698\n", + "2019-01-31 01:29:16,712 : INFO : PROGRESS: pass 0, at document #4250000/4922894\n", + "2019-01-31 01:29:18,098 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:18,365 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:29:18,366 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.029*\"pari\" + 0.023*\"sail\" + 0.023*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.011*\"loui\" + 0.010*\"wine\"\n", + "2019-01-31 01:29:18,367 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"citi\"\n", + "2019-01-31 01:29:18,368 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.005*\"measur\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:29:18,369 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 
01:29:18,375 : INFO : topic diff=0.003000, rho=0.021693\n", + "2019-01-31 01:29:18,528 : INFO : PROGRESS: pass 0, at document #4252000/4922894\n", + "2019-01-31 01:29:19,874 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:20,140 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:29:20,141 : INFO : topic #33 (0.020): 0.058*\"french\" + 0.043*\"franc\" + 0.029*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.011*\"loui\" + 0.011*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:29:20,142 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:29:20,143 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"trap\" + 0.006*\"incom\"\n", + "2019-01-31 01:29:20,144 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:29:20,150 : INFO : topic diff=0.003174, rho=0.021688\n", + "2019-01-31 01:29:20,362 : INFO : PROGRESS: pass 0, at document #4254000/4922894\n", + "2019-01-31 01:29:21,753 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:22,020 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.035*\"cotton\" + 0.035*\"tortur\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:29:22,021 : 
INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:29:22,022 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.019*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:29:22,023 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:29:22,024 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:29:22,030 : INFO : topic diff=0.003509, rho=0.021683\n", + "2019-01-31 01:29:22,184 : INFO : PROGRESS: pass 0, at document #4256000/4922894\n", + "2019-01-31 01:29:23,544 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:23,811 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"jame\" + 0.011*\"will\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:29:23,812 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\"\n", + "2019-01-31 01:29:23,813 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"pistol\" + 0.011*\"silicon\" + 0.010*\"centuri\"\n", + "2019-01-31 01:29:23,814 : INFO : topic #23 (0.020): 
0.138*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.032*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:29:23,815 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.026*\"australia\" + 0.025*\"new\" + 0.023*\"australian\" + 0.022*\"england\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:29:23,820 : INFO : topic diff=0.003445, rho=0.021678\n", + "2019-01-31 01:29:23,977 : INFO : PROGRESS: pass 0, at document #4258000/4922894\n", + "2019-01-31 01:29:25,349 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:25,616 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:29:25,617 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"jack\"\n", + "2019-01-31 01:29:25,618 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.027*\"champion\" + 0.025*\"olymp\" + 0.025*\"woman\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"alic\" + 0.017*\"nation\"\n", + "2019-01-31 01:29:25,619 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:29:25,620 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.031*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:29:25,626 : INFO : topic 
diff=0.004405, rho=0.021673\n", + "2019-01-31 01:29:28,311 : INFO : -11.591 per-word bound, 3084.4 perplexity estimate based on a held-out corpus of 2000 documents with 547586 words\n", + "2019-01-31 01:29:28,312 : INFO : PROGRESS: pass 0, at document #4260000/4922894\n", + "2019-01-31 01:29:29,688 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:29,955 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"pistol\" + 0.011*\"silicon\" + 0.010*\"centuri\"\n", + "2019-01-31 01:29:29,956 : INFO : topic #48 (0.020): 0.079*\"sens\" + 0.079*\"march\" + 0.078*\"octob\" + 0.069*\"januari\" + 0.069*\"juli\" + 0.068*\"august\" + 0.067*\"notion\" + 0.066*\"judici\" + 0.066*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:29:29,957 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"coalit\" + 0.010*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 01:29:29,958 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:29:29,959 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.016*\"colder\"\n", + "2019-01-31 01:29:29,965 : INFO : topic diff=0.002638, rho=0.021668\n", + "2019-01-31 01:29:30,125 : INFO : PROGRESS: pass 0, at document #4262000/4922894\n", + "2019-01-31 01:29:31,514 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:31,781 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"exampl\" 
+ 0.006*\"gener\" + 0.006*\"utopian\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:29:31,782 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"damag\" + 0.015*\"sweden\" + 0.014*\"wind\" + 0.014*\"norwai\" + 0.014*\"swedish\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.009*\"denmark\"\n", + "2019-01-31 01:29:31,783 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.079*\"sens\" + 0.078*\"octob\" + 0.069*\"januari\" + 0.069*\"juli\" + 0.068*\"august\" + 0.067*\"notion\" + 0.067*\"judici\" + 0.066*\"april\" + 0.064*\"decatur\"\n", + "2019-01-31 01:29:31,784 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.035*\"cotton\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:29:31,785 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.010*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:29:31,791 : INFO : topic diff=0.002990, rho=0.021662\n", + "2019-01-31 01:29:31,949 : INFO : PROGRESS: pass 0, at document #4264000/4922894\n", + "2019-01-31 01:29:33,345 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:33,612 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.035*\"cotton\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:29:33,613 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.011*\"historiographi\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"poll\"\n", + "2019-01-31 01:29:33,614 : INFO : 
topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:29:33,615 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.016*\"damag\" + 0.015*\"sweden\" + 0.014*\"norwai\" + 0.014*\"wind\" + 0.014*\"swedish\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.009*\"denmark\"\n", + "2019-01-31 01:29:33,616 : INFO : topic #37 (0.020): 0.013*\"anim\" + 0.013*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.006*\"black\"\n", + "2019-01-31 01:29:33,622 : INFO : topic diff=0.003069, rho=0.021657\n", + "2019-01-31 01:29:33,778 : INFO : PROGRESS: pass 0, at document #4266000/4922894\n", + "2019-01-31 01:29:35,160 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:35,427 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"turn\"\n", + "2019-01-31 01:29:35,428 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:29:35,429 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:29:35,430 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:29:35,431 : 
INFO : topic #49 (0.020): 0.045*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.010*\"sri\" + 0.010*\"muskoge\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:29:35,437 : INFO : topic diff=0.003100, rho=0.021652\n", + "2019-01-31 01:29:35,595 : INFO : PROGRESS: pass 0, at document #4268000/4922894\n", + "2019-01-31 01:29:36,990 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:37,257 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.013*\"simpler\"\n", + "2019-01-31 01:29:37,258 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:29:37,259 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:29:37,260 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.070*\"best\" + 0.034*\"yawn\" + 0.031*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:29:37,261 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:29:37,267 : INFO : topic diff=0.003114, rho=0.021647\n", + "2019-01-31 01:29:37,426 : INFO : PROGRESS: pass 0, at document #4270000/4922894\n", + "2019-01-31 01:29:38,820 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 01:29:39,087 : INFO : topic #33 (0.020): 0.057*\"french\" + 0.043*\"franc\" + 0.028*\"pari\" + 0.023*\"wreath\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"wine\" + 0.011*\"loui\"\n", + "2019-01-31 01:29:39,088 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"jame\" + 0.011*\"david\" + 0.011*\"will\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:29:39,089 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:29:39,090 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:29:39,091 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:29:39,097 : INFO : topic diff=0.003089, rho=0.021642\n", + "2019-01-31 01:29:39,257 : INFO : PROGRESS: pass 0, at document #4272000/4922894\n", + "2019-01-31 01:29:40,663 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:40,930 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.023*\"palmer\" + 0.019*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:29:40,931 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:29:40,932 : INFO : topic #16 (0.020): 
0.055*\"king\" + 0.031*\"priest\" + 0.019*\"idiosyncrat\" + 0.019*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"grammat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.012*\"count\"\n", + "2019-01-31 01:29:40,933 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:29:40,934 : INFO : topic #46 (0.020): 0.016*\"stop\" + 0.015*\"damag\" + 0.015*\"sweden\" + 0.014*\"wind\" + 0.014*\"norwai\" + 0.014*\"swedish\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.009*\"turkish\"\n", + "2019-01-31 01:29:40,940 : INFO : topic diff=0.003378, rho=0.021637\n", + "2019-01-31 01:29:41,102 : INFO : PROGRESS: pass 0, at document #4274000/4922894\n", + "2019-01-31 01:29:42,495 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:42,762 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:29:42,763 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:29:42,764 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.049*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:29:42,765 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.014*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:29:42,766 : INFO : topic #49 (0.020): 0.045*\"india\" + 
0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"televis\" + 0.012*\"pakistan\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:29:42,772 : INFO : topic diff=0.003894, rho=0.021632\n", + "2019-01-31 01:29:42,928 : INFO : PROGRESS: pass 0, at document #4276000/4922894\n", + "2019-01-31 01:29:44,282 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:29:44,549 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.021*\"candid\" + 0.018*\"taxpay\" + 0.015*\"ret\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.011*\"find\" + 0.011*\"fool\" + 0.010*\"horac\" + 0.010*\"champion\"\n", + "2019-01-31 01:29:44,550 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"offic\" + 0.025*\"minist\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:29:44,551 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"sourc\" + 0.025*\"australia\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:29:44,552 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"trap\" + 0.006*\"incom\"\n", + "2019-01-31 01:29:44,553 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.018*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.015*\"bypass\" + 0.013*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:29:44,559 : INFO : topic diff=0.003050, rho=0.021627\n", + "2019-01-31 01:29:44,716 : INFO : PROGRESS: pass 0, at document #4278000/4922894\n", + "2019-01-31 01:29:46,088 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:29:46,355 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:29:46,356 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:29:46,357 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"field\"\n", + "2019-01-31 01:29:46,358 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:29:46,359 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\" + 0.010*\"centuri\"\n", + "2019-01-31 01:29:46,365 : INFO : topic diff=0.003646, rho=0.021622\n", + "2019-01-31 01:29:48,981 : INFO : -11.619 per-word bound, 3145.6 perplexity estimate based on a held-out corpus of 2000 documents with 516782 words\n", + "2019-01-31 01:29:48,981 : INFO : PROGRESS: pass 0, at document #4280000/4922894\n", + "2019-01-31 01:29:50,325 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:50,592 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:29:50,593 : INFO : topic #33 (0.020): 
0.057*\"french\" + 0.043*\"franc\" + 0.028*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.021*\"wreath\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"wine\" + 0.011*\"loui\"\n", + "2019-01-31 01:29:50,594 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:29:50,596 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:29:50,597 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.016*\"intern\" + 0.013*\"winner\"\n", + "2019-01-31 01:29:50,602 : INFO : topic diff=0.003364, rho=0.021617\n", + "2019-01-31 01:29:50,762 : INFO : PROGRESS: pass 0, at document #4282000/4922894\n", + "2019-01-31 01:29:52,143 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:52,409 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.015*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:29:52,410 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:29:52,412 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"word\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.007*\"woman\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:29:52,413 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 
0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:29:52,414 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"degre\" + 0.012*\"word\" + 0.011*\"http\"\n", + "2019-01-31 01:29:52,420 : INFO : topic diff=0.003373, rho=0.021612\n", + "2019-01-31 01:29:52,571 : INFO : PROGRESS: pass 0, at document #4284000/4922894\n", + "2019-01-31 01:29:53,915 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:54,182 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:29:54,182 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.035*\"cotton\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:29:54,183 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:29:54,185 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"field\"\n", + "2019-01-31 01:29:54,185 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.027*\"champion\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"alic\" + 0.017*\"atheist\"\n", + "2019-01-31 01:29:54,191 : INFO : topic diff=0.003117, rho=0.021607\n", + 
"2019-01-31 01:29:54,349 : INFO : PROGRESS: pass 0, at document #4286000/4922894\n", + "2019-01-31 01:29:55,722 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:55,989 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:29:55,990 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.023*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:29:55,991 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"cathol\" + 0.023*\"christian\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\"\n", + "2019-01-31 01:29:55,992 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:29:55,993 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:29:55,999 : INFO : topic diff=0.002996, rho=0.021602\n", + "2019-01-31 01:29:56,210 : INFO : PROGRESS: pass 0, at document #4288000/4922894\n", + "2019-01-31 01:29:57,693 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:29:57,960 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.035*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 
0.018*\"citi\"\n", + "2019-01-31 01:29:57,961 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.014*\"santa\" + 0.013*\"soviet\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:29:57,962 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.025*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"open\" + 0.014*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\"\n", + "2019-01-31 01:29:57,964 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.015*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:29:57,965 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:29:57,970 : INFO : topic diff=0.003408, rho=0.021597\n", + "2019-01-31 01:29:58,127 : INFO : PROGRESS: pass 0, at document #4290000/4922894\n", + "2019-01-31 01:29:59,501 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:29:59,767 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:29:59,769 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:29:59,770 : INFO : topic #32 (0.020): 0.052*\"district\" + 0.044*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.035*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + 
"2019-01-31 01:29:59,771 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.078*\"march\" + 0.077*\"octob\" + 0.068*\"januari\" + 0.067*\"notion\" + 0.066*\"juli\" + 0.066*\"april\" + 0.066*\"august\" + 0.064*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 01:29:59,772 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"der\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:29:59,778 : INFO : topic diff=0.003606, rho=0.021592\n", + "2019-01-31 01:29:59,938 : INFO : PROGRESS: pass 0, at document #4292000/4922894\n", + "2019-01-31 01:30:01,356 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:01,623 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:30:01,624 : INFO : topic #3 (0.020): 0.035*\"present\" + 0.026*\"minist\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:30:01,625 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\" + 0.009*\"lobe\"\n", + "2019-01-31 01:30:01,626 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.078*\"march\" + 0.077*\"octob\" + 0.068*\"januari\" + 0.067*\"notion\" + 0.066*\"juli\" + 0.066*\"august\" + 0.066*\"april\" + 0.064*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:30:01,627 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 
01:30:01,633 : INFO : topic diff=0.003357, rho=0.021587\n", + "2019-01-31 01:30:01,788 : INFO : PROGRESS: pass 0, at document #4294000/4922894\n", + "2019-01-31 01:30:03,150 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:03,416 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.025*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.014*\"open\" + 0.014*\"chamber\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\"\n", + "2019-01-31 01:30:03,418 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.006*\"field\"\n", + "2019-01-31 01:30:03,419 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:30:03,420 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"centuri\" + 0.010*\"pistol\"\n", + "2019-01-31 01:30:03,421 : INFO : topic #48 (0.020): 0.078*\"sens\" + 0.078*\"march\" + 0.076*\"octob\" + 0.068*\"januari\" + 0.067*\"august\" + 0.067*\"notion\" + 0.066*\"juli\" + 0.066*\"april\" + 0.064*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:30:03,427 : INFO : topic diff=0.003191, rho=0.021582\n", + "2019-01-31 01:30:03,581 : INFO : PROGRESS: pass 0, at document #4296000/4922894\n", + "2019-01-31 01:30:04,978 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:05,244 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.015*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + 
"2019-01-31 01:30:05,245 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:30:05,246 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"disco\" + 0.008*\"media\" + 0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:30:05,247 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.018*\"duke\" + 0.018*\"grammat\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"portugues\" + 0.013*\"maria\"\n", + "2019-01-31 01:30:05,249 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"cathol\" + 0.023*\"christian\" + 0.023*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\"\n", + "2019-01-31 01:30:05,254 : INFO : topic diff=0.002855, rho=0.021577\n", + "2019-01-31 01:30:05,412 : INFO : PROGRESS: pass 0, at document #4298000/4922894\n", + "2019-01-31 01:30:06,802 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:07,070 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:30:07,071 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"land\" + 0.009*\"lobe\"\n", + "2019-01-31 01:30:07,072 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"anim\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 
0.006*\"black\"\n", + "2019-01-31 01:30:07,073 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"user\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:30:07,074 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwai\" + 0.014*\"damag\" + 0.013*\"treeless\" + 0.013*\"norwegian\" + 0.011*\"huntsvil\" + 0.009*\"denmark\"\n", + "2019-01-31 01:30:07,080 : INFO : topic diff=0.003643, rho=0.021572\n", + "2019-01-31 01:30:09,809 : INFO : -11.602 per-word bound, 3108.6 perplexity estimate based on a held-out corpus of 2000 documents with 566311 words\n", + "2019-01-31 01:30:09,809 : INFO : PROGRESS: pass 0, at document #4300000/4922894\n", + "2019-01-31 01:30:11,199 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:30:11,465 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:30:11,466 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:30:11,467 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.034*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:30:11,468 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 
0.012*\"schmitz\"\n", + "2019-01-31 01:30:11,469 : INFO : topic #9 (0.020): 0.069*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.018*\"dutch\" + 0.017*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.015*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:30:11,475 : INFO : topic diff=0.002694, rho=0.021567\n", + "2019-01-31 01:30:11,634 : INFO : PROGRESS: pass 0, at document #4302000/4922894\n", + "2019-01-31 01:30:13,036 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:13,303 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.069*\"best\" + 0.034*\"yawn\" + 0.030*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:30:13,304 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.021*\"requir\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.019*\"student\" + 0.015*\"professor\" + 0.012*\"degre\" + 0.012*\"word\" + 0.011*\"governor\"\n", + "2019-01-31 01:30:13,305 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"magazin\" + 0.011*\"storag\"\n", + "2019-01-31 01:30:13,306 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"spectacl\"\n", + "2019-01-31 01:30:13,307 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.043*\"line\" + 0.031*\"raid\" + 0.029*\"rivièr\" + 0.027*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:30:13,313 : INFO : topic diff=0.003273, rho=0.021562\n", + "2019-01-31 01:30:13,468 : INFO : PROGRESS: pass 0, at document #4304000/4922894\n", + "2019-01-31 01:30:14,839 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:15,105 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"cathol\" + 0.023*\"christian\" + 0.022*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\"\n", + "2019-01-31 01:30:15,106 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.034*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.011*\"jack\"\n", + "2019-01-31 01:30:15,107 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.005*\"field\"\n", + "2019-01-31 01:30:15,109 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"till\" + 0.006*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:30:15,110 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.019*\"grammat\" + 0.018*\"duke\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 01:30:15,115 : INFO : topic diff=0.002852, rho=0.021557\n", + "2019-01-31 01:30:15,273 : INFO : PROGRESS: pass 0, at document #4306000/4922894\n", + "2019-01-31 01:30:16,663 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:16,929 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"magazin\" + 0.011*\"storag\"\n", + "2019-01-31 01:30:16,930 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.014*\"berlin\" + 
0.014*\"israel\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:30:16,932 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:30:16,933 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:30:16,934 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"grammat\" + 0.019*\"idiosyncrat\" + 0.019*\"duke\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"maria\"\n", + "2019-01-31 01:30:16,939 : INFO : topic diff=0.003345, rho=0.021552\n", + "2019-01-31 01:30:17,095 : INFO : PROGRESS: pass 0, at document #4308000/4922894\n", + "2019-01-31 01:30:18,471 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:18,738 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.015*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"daughter\"\n", + "2019-01-31 01:30:18,739 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:30:18,740 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"sens\" + 0.076*\"octob\" + 0.069*\"januari\" + 0.067*\"august\" + 0.067*\"juli\" + 0.066*\"notion\" + 0.066*\"april\" + 0.064*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 01:30:18,741 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 
0.009*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:30:18,742 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:30:18,748 : INFO : topic diff=0.002474, rho=0.021547\n", + "2019-01-31 01:30:18,906 : INFO : PROGRESS: pass 0, at document #4310000/4922894\n", + "2019-01-31 01:30:20,273 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:20,540 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"servitud\" + 0.005*\"field\"\n", + "2019-01-31 01:30:20,541 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.042*\"line\" + 0.031*\"raid\" + 0.030*\"rivièr\" + 0.027*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:30:20,542 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.017*\"mexico\" + 0.017*\"del\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"carlo\"\n", + "2019-01-31 01:30:20,543 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.019*\"narrat\" + 0.015*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:30:20,544 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:30:20,550 : INFO : topic diff=0.003426, rho=0.021542\n", + "2019-01-31 01:30:20,702 : INFO : PROGRESS: pass 0, at document #4312000/4922894\n", + "2019-01-31 01:30:22,052 
: INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:22,318 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.034*\"cotton\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:30:22,320 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.050*\"chilton\" + 0.024*\"hong\" + 0.024*\"kong\" + 0.022*\"korea\" + 0.019*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:30:22,321 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.017*\"player\" + 0.017*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:30:22,322 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.035*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.019*\"moscow\" + 0.019*\"poland\" + 0.016*\"tyrant\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:30:22,323 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:30:22,329 : INFO : topic diff=0.002987, rho=0.021537\n", + "2019-01-31 01:30:22,489 : INFO : PROGRESS: pass 0, at document #4314000/4922894\n", + "2019-01-31 01:30:23,896 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:24,162 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.018*\"member\" + 0.016*\"republ\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"seaport\"\n", + "2019-01-31 01:30:24,164 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 
0.027*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.025*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:30:24,165 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.029*\"museo\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.017*\"exhaust\" + 0.016*\"artist\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:30:24,166 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"affection\" + 0.011*\"televis\" + 0.010*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:30:24,167 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"cathol\" + 0.023*\"christian\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:30:24,173 : INFO : topic diff=0.003430, rho=0.021532\n", + "2019-01-31 01:30:24,330 : INFO : PROGRESS: pass 0, at document #4316000/4922894\n", + "2019-01-31 01:30:25,708 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:25,974 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.018*\"member\" + 0.016*\"republ\" + 0.016*\"polici\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 0.013*\"selma\"\n", + "2019-01-31 01:30:25,975 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:30:25,976 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:30:25,977 : INFO : topic #22 (0.020): 
0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"incom\" + 0.006*\"trap\"\n", + "2019-01-31 01:30:25,978 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:30:25,984 : INFO : topic diff=0.003749, rho=0.021527\n", + "2019-01-31 01:30:26,196 : INFO : PROGRESS: pass 0, at document #4318000/4922894\n", + "2019-01-31 01:30:27,558 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:27,825 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"affection\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:30:27,826 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.022*\"armi\" + 0.021*\"walter\" + 0.018*\"com\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:30:27,827 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:30:27,828 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.015*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"horac\" + 0.010*\"squatter\"\n", + "2019-01-31 01:30:27,829 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.014*\"jewish\" + 0.014*\"israel\" + 0.014*\"berlin\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:30:27,835 : INFO : topic diff=0.003532, 
rho=0.021522\n", + "2019-01-31 01:30:30,578 : INFO : -11.686 per-word bound, 3294.5 perplexity estimate based on a held-out corpus of 2000 documents with 558351 words\n", + "2019-01-31 01:30:30,579 : INFO : PROGRESS: pass 0, at document #4320000/4922894\n", + "2019-01-31 01:30:31,984 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:32,251 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"cathol\" + 0.024*\"christian\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:30:32,252 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"sens\" + 0.076*\"octob\" + 0.070*\"januari\" + 0.067*\"juli\" + 0.067*\"august\" + 0.067*\"notion\" + 0.066*\"april\" + 0.065*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:30:32,253 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\" + 0.009*\"vacant\"\n", + "2019-01-31 01:30:32,254 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"storag\"\n", + "2019-01-31 01:30:32,255 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.014*\"tiepolo\"\n", + "2019-01-31 01:30:32,261 : INFO : topic diff=0.003003, rho=0.021517\n", + "2019-01-31 01:30:32,421 : INFO : PROGRESS: pass 0, at document #4322000/4922894\n", + "2019-01-31 01:30:33,801 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:34,069 : INFO : topic #10 (0.020): 0.012*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" 
+ 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\" + 0.006*\"proper\"\n", + "2019-01-31 01:30:34,070 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"armi\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:30:34,071 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.013*\"pour\" + 0.009*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"teratogen\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:30:34,072 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:30:34,074 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"storag\"\n", + "2019-01-31 01:30:34,079 : INFO : topic diff=0.003004, rho=0.021512\n", + "2019-01-31 01:30:34,240 : INFO : PROGRESS: pass 0, at document #4324000/4922894\n", + "2019-01-31 01:30:35,619 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:35,886 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:30:35,887 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:30:35,888 : INFO : topic #9 (0.020): 
0.069*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.017*\"player\" + 0.017*\"folei\" + 0.016*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:30:35,889 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.027*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"open\" + 0.013*\"tiepolo\"\n", + "2019-01-31 01:30:35,890 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.029*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"exhaust\" + 0.016*\"artist\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:30:35,896 : INFO : topic diff=0.002871, rho=0.021507\n", + "2019-01-31 01:30:36,048 : INFO : PROGRESS: pass 0, at document #4326000/4922894\n", + "2019-01-31 01:30:37,401 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:37,667 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.070*\"januari\" + 0.068*\"juli\" + 0.068*\"august\" + 0.067*\"notion\" + 0.066*\"april\" + 0.065*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:30:37,668 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:30:37,669 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.020*\"act\" + 0.018*\"start\" + 0.014*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:30:37,670 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.027*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:30:37,671 : INFO : topic #49 (0.020): 0.044*\"india\" + 
0.033*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:30:37,677 : INFO : topic diff=0.004297, rho=0.021502\n", + "2019-01-31 01:30:37,838 : INFO : PROGRESS: pass 0, at document #4328000/4922894\n", + "2019-01-31 01:30:39,251 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:39,517 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.014*\"open\"\n", + "2019-01-31 01:30:39,518 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:30:39,520 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.027*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:30:39,521 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\" + 0.009*\"lobe\"\n", + "2019-01-31 01:30:39,522 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.015*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:30:39,528 : INFO : topic diff=0.003342, rho=0.021497\n", + "2019-01-31 01:30:39,687 : INFO : PROGRESS: pass 0, at document #4330000/4922894\n", + "2019-01-31 01:30:41,074 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:41,340 : INFO : topic #22 (0.020): 0.034*\"spars\" + 
0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.006*\"incom\" + 0.006*\"trap\"\n", + "2019-01-31 01:30:41,341 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.011*\"jame\" + 0.011*\"david\" + 0.011*\"will\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.009*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:30:41,343 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"teratogen\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:30:41,344 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.017*\"mexico\" + 0.017*\"del\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.011*\"carlo\"\n", + "2019-01-31 01:30:41,345 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:30:41,351 : INFO : topic diff=0.002889, rho=0.021492\n", + "2019-01-31 01:30:41,508 : INFO : PROGRESS: pass 0, at document #4332000/4922894\n", + "2019-01-31 01:30:42,891 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:43,158 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:30:43,159 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.023*\"spain\" + 0.017*\"mexico\" + 0.017*\"del\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"francisco\" + 0.011*\"carlo\" + 0.011*\"juan\"\n", + "2019-01-31 01:30:43,160 : INFO : topic #13 (0.020): 0.026*\"australia\" + 
0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.020*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:30:43,161 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.027*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:30:43,162 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:30:43,168 : INFO : topic diff=0.002964, rho=0.021487\n", + "2019-01-31 01:30:43,324 : INFO : PROGRESS: pass 0, at document #4334000/4922894\n", + "2019-01-31 01:30:44,688 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:44,954 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.050*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:30:44,956 : INFO : topic #29 (0.020): 0.030*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:30:44,957 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.033*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.011*\"televis\" + 0.010*\"khalsa\" + 0.009*\"sri\"\n", + "2019-01-31 01:30:44,958 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.041*\"line\" + 0.031*\"rivièr\" + 0.030*\"raid\" + 0.027*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:30:44,959 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" 
+ 0.015*\"swedish\" + 0.015*\"wind\" + 0.014*\"treeless\" + 0.014*\"damag\" + 0.014*\"norwai\" + 0.012*\"norwegian\" + 0.011*\"huntsvil\" + 0.009*\"denmark\"\n", + "2019-01-31 01:30:44,965 : INFO : topic diff=0.003669, rho=0.021482\n", + "2019-01-31 01:30:45,123 : INFO : PROGRESS: pass 0, at document #4336000/4922894\n", + "2019-01-31 01:30:46,510 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:46,777 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.015*\"wind\" + 0.014*\"damag\" + 0.014*\"treeless\" + 0.014*\"norwai\" + 0.012*\"norwegian\" + 0.011*\"huntsvil\" + 0.009*\"denmark\"\n", + "2019-01-31 01:30:46,778 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:30:46,779 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.009*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:30:46,780 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"cathol\" + 0.024*\"christian\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:30:46,781 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:30:46,787 : INFO : topic diff=0.003270, rho=0.021477\n", + "2019-01-31 01:30:46,945 : INFO : PROGRESS: pass 0, at document #4338000/4922894\n", + "2019-01-31 01:30:48,322 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:30:48,588 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:30:48,589 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:30:48,590 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.037*\"shield\" + 0.019*\"narrat\" + 0.015*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"bahá\" + 0.009*\"class\"\n", + "2019-01-31 01:30:48,592 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:30:48,593 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.016*\"artist\" + 0.016*\"gai\"\n", + "2019-01-31 01:30:48,598 : INFO : topic diff=0.002652, rho=0.021472\n", + "2019-01-31 01:30:51,267 : INFO : -11.549 per-word bound, 2996.8 perplexity estimate based on a held-out corpus of 2000 documents with 549907 words\n", + "2019-01-31 01:30:51,268 : INFO : PROGRESS: pass 0, at document #4340000/4922894\n", + "2019-01-31 01:30:52,634 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:52,901 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.034*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"poison\" + 0.026*\"reprint\" + 0.025*\"personifi\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.016*\"tyrant\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:30:52,902 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 
0.029*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"wreath\" + 0.013*\"loui\" + 0.012*\"lazi\" + 0.011*\"piec\"\n", + "2019-01-31 01:30:52,903 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.024*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:30:52,904 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.008*\"frontal\" + 0.007*\"gener\" + 0.007*\"poet\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"method\"\n", + "2019-01-31 01:30:52,905 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"jack\" + 0.012*\"olympo\"\n", + "2019-01-31 01:30:52,911 : INFO : topic diff=0.002908, rho=0.021467\n", + "2019-01-31 01:30:53,064 : INFO : PROGRESS: pass 0, at document #4342000/4922894\n", + "2019-01-31 01:30:54,409 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:54,675 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.050*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:30:54,676 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:30:54,677 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:30:54,678 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 
0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:30:54,679 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.034*\"incumb\" + 0.014*\"islam\" + 0.012*\"pakistan\" + 0.011*\"muskoge\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.010*\"televis\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:30:54,685 : INFO : topic diff=0.002702, rho=0.021462\n", + "2019-01-31 01:30:54,842 : INFO : PROGRESS: pass 0, at document #4344000/4922894\n", + "2019-01-31 01:30:56,238 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:56,505 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:30:56,506 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.015*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:30:56,507 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.050*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:30:56,508 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:30:56,509 : INFO : topic #31 (0.020): 0.052*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:30:56,515 : INFO : topic diff=0.002941, rho=0.021457\n", + "2019-01-31 01:30:56,671 : INFO : PROGRESS: 
pass 0, at document #4346000/4922894\n", + "2019-01-31 01:30:58,028 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:30:58,295 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.026*\"scientist\" + 0.024*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:30:58,296 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.027*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:30:58,297 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:30:58,298 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:30:58,299 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:30:58,305 : INFO : topic diff=0.002348, rho=0.021452\n", + "2019-01-31 01:30:58,456 : INFO : PROGRESS: pass 0, at document #4348000/4922894\n", + "2019-01-31 01:30:59,810 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:00,076 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"horac\" + 0.010*\"squatter\"\n", + "2019-01-31 01:31:00,077 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.040*\"line\" + 0.033*\"rivièr\" + 
0.031*\"raid\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:31:00,078 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"govern\" + 0.006*\"citi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:31:00,079 : INFO : topic #47 (0.020): 0.063*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.015*\"damn\" + 0.014*\"physician\" + 0.013*\"orchestr\" + 0.012*\"jack\" + 0.012*\"olympo\"\n", + "2019-01-31 01:31:00,080 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:31:00,086 : INFO : topic diff=0.003482, rho=0.021447\n", + "2019-01-31 01:31:00,295 : INFO : PROGRESS: pass 0, at document #4350000/4922894\n", + "2019-01-31 01:31:01,662 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:01,928 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.019*\"player\" + 0.018*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:31:01,929 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:31:01,931 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:31:01,932 : INFO : 
topic #23 (0.020): 0.136*\"audit\" + 0.068*\"best\" + 0.033*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:31:01,933 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:31:01,939 : INFO : topic diff=0.002871, rho=0.021442\n", + "2019-01-31 01:31:02,094 : INFO : PROGRESS: pass 0, at document #4352000/4922894\n", + "2019-01-31 01:31:03,471 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:03,737 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:31:03,738 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.017*\"colder\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.016*\"artist\"\n", + "2019-01-31 01:31:03,739 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.077*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.068*\"notion\" + 0.068*\"juli\" + 0.067*\"august\" + 0.067*\"april\" + 0.066*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:31:03,740 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.040*\"line\" + 0.033*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:31:03,741 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.023*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:31:03,747 : INFO : topic diff=0.003177, 
rho=0.021437\n", + "2019-01-31 01:31:03,902 : INFO : PROGRESS: pass 0, at document #4354000/4922894\n", + "2019-01-31 01:31:05,256 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:05,522 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.017*\"israel\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"austria\" + 0.009*\"isra\"\n", + "2019-01-31 01:31:05,523 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:31:05,524 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.027*\"poison\" + 0.027*\"reprint\" + 0.024*\"personifi\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.016*\"tyrant\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:31:05,525 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:31:05,527 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:31:05,532 : INFO : topic diff=0.002585, rho=0.021432\n", + "2019-01-31 01:31:05,685 : INFO : PROGRESS: pass 0, at document #4356000/4922894\n", + "2019-01-31 01:31:07,057 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:07,323 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"horac\" + 0.011*\"squatter\"\n", + "2019-01-31 
01:31:07,325 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:31:07,326 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:31:07,327 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.067*\"august\" + 0.067*\"april\" + 0.066*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:31:07,328 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:31:07,333 : INFO : topic diff=0.003358, rho=0.021427\n", + "2019-01-31 01:31:07,491 : INFO : PROGRESS: pass 0, at document #4358000/4922894\n", + "2019-01-31 01:31:08,865 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:09,132 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:31:09,133 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:31:09,134 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"bank\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:31:09,135 : INFO 
: topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.019*\"player\" + 0.018*\"folei\" + 0.016*\"polit\" + 0.016*\"english\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:31:09,136 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"constitut\" + 0.011*\"centuri\" + 0.011*\"linear\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:31:09,142 : INFO : topic diff=0.003612, rho=0.021423\n", + "2019-01-31 01:31:11,808 : INFO : -11.610 per-word bound, 3126.5 perplexity estimate based on a held-out corpus of 2000 documents with 547628 words\n", + "2019-01-31 01:31:11,809 : INFO : PROGRESS: pass 0, at document #4360000/4922894\n", + "2019-01-31 01:31:13,182 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:13,448 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:31:13,450 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:31:13,451 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:31:13,452 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.011*\"horac\"\n", + "2019-01-31 01:31:13,453 : INFO : topic #19 (0.020): 
0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:31:13,458 : INFO : topic diff=0.003273, rho=0.021418\n", + "2019-01-31 01:31:13,615 : INFO : PROGRESS: pass 0, at document #4362000/4922894\n", + "2019-01-31 01:31:14,987 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:15,254 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.033*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.009*\"alam\"\n", + "2019-01-31 01:31:15,255 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:31:15,256 : INFO : topic #39 (0.020): 0.062*\"canada\" + 0.045*\"canadian\" + 0.025*\"toronto\" + 0.023*\"hoar\" + 0.020*\"ontario\" + 0.017*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:31:15,257 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:31:15,258 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"diggin\" + 0.007*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:31:15,264 : INFO : topic diff=0.002648, rho=0.021413\n", + "2019-01-31 01:31:15,418 : INFO : PROGRESS: pass 0, at document #4364000/4922894\n", + "2019-01-31 01:31:16,781 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
01:31:17,048 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:31:17,049 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"colder\" + 0.016*\"artist\" + 0.016*\"gai\" + 0.016*\"exhaust\"\n", + "2019-01-31 01:31:17,050 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:31:17,051 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.013*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"fool\" + 0.010*\"squatter\" + 0.010*\"horac\"\n", + "2019-01-31 01:31:17,052 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.019*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:31:17,058 : INFO : topic diff=0.003263, rho=0.021408\n", + "2019-01-31 01:31:17,216 : INFO : PROGRESS: pass 0, at document #4366000/4922894\n", + "2019-01-31 01:31:18,592 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:18,859 : INFO : topic #8 (0.020): 0.025*\"law\" + 0.022*\"cortic\" + 0.019*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.008*\"polaris\" + 0.007*\"judaism\"\n", + "2019-01-31 01:31:18,860 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.033*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.011*\"affection\" + 0.010*\"khalsa\" + 0.009*\"sri\"\n", + "2019-01-31 01:31:18,861 
: INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.067*\"april\" + 0.067*\"august\" + 0.067*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:31:18,862 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:31:18,863 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:31:18,869 : INFO : topic diff=0.003353, rho=0.021403\n", + "2019-01-31 01:31:19,029 : INFO : PROGRESS: pass 0, at document #4368000/4922894\n", + "2019-01-31 01:31:20,431 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:20,697 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.027*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.021*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:31:20,698 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:31:20,700 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\" + 0.007*\"paul\"\n", + "2019-01-31 01:31:20,701 : INFO : topic #46 (0.020): 0.016*\"sweden\" + 0.016*\"stop\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwai\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.010*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:31:20,702 : 
INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"colder\" + 0.016*\"gai\" + 0.016*\"exhaust\"\n", + "2019-01-31 01:31:20,707 : INFO : topic diff=0.002580, rho=0.021398\n", + "2019-01-31 01:31:20,863 : INFO : PROGRESS: pass 0, at document #4370000/4922894\n", + "2019-01-31 01:31:22,214 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:22,481 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.024*\"schuster\" + 0.022*\"requir\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.018*\"student\" + 0.014*\"professor\" + 0.012*\"degre\" + 0.012*\"word\" + 0.011*\"http\"\n", + "2019-01-31 01:31:22,483 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:31:22,484 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.006*\"teratogen\" + 0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:31:22,485 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:31:22,486 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.016*\"gai\"\n", + "2019-01-31 01:31:22,492 : INFO : topic diff=0.003363, rho=0.021393\n", + "2019-01-31 01:31:22,647 : INFO : PROGRESS: pass 0, at document #4372000/4922894\n", + "2019-01-31 01:31:24,017 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 
01:31:24,284 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:31:24,285 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.019*\"player\" + 0.018*\"folei\" + 0.017*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:31:24,286 : INFO : topic #30 (0.020): 0.037*\"cleveland\" + 0.036*\"leagu\" + 0.029*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:31:24,287 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:31:24,288 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:31:24,294 : INFO : topic diff=0.003405, rho=0.021388\n", + "2019-01-31 01:31:24,447 : INFO : PROGRESS: pass 0, at document #4374000/4922894\n", + "2019-01-31 01:31:25,806 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:26,072 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.030*\"jpg\" + 0.029*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"colder\" + 0.016*\"gai\" + 0.016*\"exhaust\"\n", + "2019-01-31 01:31:26,073 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 
0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:31:26,074 : INFO : topic #46 (0.020): 0.016*\"sweden\" + 0.016*\"stop\" + 0.015*\"swedish\" + 0.014*\"wind\" + 0.014*\"norwai\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.010*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:31:26,075 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:31:26,076 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"minist\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.015*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:31:26,082 : INFO : topic diff=0.002791, rho=0.021383\n", + "2019-01-31 01:31:26,238 : INFO : PROGRESS: pass 0, at document #4376000/4922894\n", + "2019-01-31 01:31:27,614 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:27,880 : INFO : topic #46 (0.020): 0.016*\"sweden\" + 0.016*\"stop\" + 0.015*\"swedish\" + 0.014*\"norwai\" + 0.014*\"wind\" + 0.014*\"damag\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.010*\"turkish\" + 0.010*\"huntsvil\"\n", + "2019-01-31 01:31:27,881 : INFO : topic #37 (0.020): 0.013*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:31:27,882 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.066*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:31:27,883 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" 
+ 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:31:27,884 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"minist\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.015*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:31:27,890 : INFO : topic diff=0.002574, rho=0.021378\n", + "2019-01-31 01:31:28,048 : INFO : PROGRESS: pass 0, at document #4378000/4922894\n", + "2019-01-31 01:31:29,885 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:30,153 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.013*\"ret\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"find\" + 0.010*\"horac\" + 0.010*\"squatter\"\n", + "2019-01-31 01:31:30,154 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"christian\" + 0.024*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:31:30,156 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:31:30,157 : INFO : topic #25 (0.020): 0.034*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"mount\" + 0.015*\"warmth\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"vacant\"\n", + "2019-01-31 01:31:30,158 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:31:30,164 : INFO : topic diff=0.003235, rho=0.021374\n", + "2019-01-31 01:31:32,783 : INFO : -11.474 per-word bound, 2844.8 perplexity estimate based on a held-out corpus of 2000 documents with 
538335 words\n", + "2019-01-31 01:31:32,783 : INFO : PROGRESS: pass 0, at document #4380000/4922894\n", + "2019-01-31 01:31:34,129 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:34,398 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.043*\"franc\" + 0.029*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.016*\"daphn\" + 0.015*\"wreath\" + 0.013*\"lazi\" + 0.013*\"loui\" + 0.011*\"piec\"\n", + "2019-01-31 01:31:34,399 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.076*\"octob\" + 0.076*\"sens\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.067*\"juli\" + 0.066*\"august\" + 0.065*\"april\" + 0.065*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:31:34,400 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"seaport\" + 0.013*\"report\"\n", + "2019-01-31 01:31:34,402 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.024*\"men\" + 0.024*\"olymp\" + 0.021*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"nation\"\n", + "2019-01-31 01:31:34,403 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:31:34,408 : INFO : topic diff=0.002900, rho=0.021369\n", + "2019-01-31 01:31:34,563 : INFO : PROGRESS: pass 0, at document #4382000/4922894\n", + "2019-01-31 01:31:36,206 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:36,473 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.015*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.013*\"brazil\"\n", + "2019-01-31 01:31:36,474 : INFO : topic #22 
(0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"incom\" + 0.007*\"florida\" + 0.006*\"trap\"\n", + "2019-01-31 01:31:36,475 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.015*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:31:36,475 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.014*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:31:36,477 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.017*\"israel\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.009*\"isra\" + 0.009*\"austria\"\n", + "2019-01-31 01:31:36,482 : INFO : topic diff=0.003314, rho=0.021364\n", + "2019-01-31 01:31:36,694 : INFO : PROGRESS: pass 0, at document #4384000/4922894\n", + "2019-01-31 01:31:38,057 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:38,323 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.010*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:31:38,324 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"battalion\" + 0.008*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"till\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:31:38,325 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"mean\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:31:38,326 : INFO : topic #42 (0.020): 0.047*\"german\" + 
0.032*\"germani\" + 0.017*\"israel\" + 0.015*\"vol\" + 0.015*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"isra\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:31:38,327 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:31:38,333 : INFO : topic diff=0.002861, rho=0.021359\n", + "2019-01-31 01:31:38,486 : INFO : PROGRESS: pass 0, at document #4386000/4922894\n", + "2019-01-31 01:31:39,851 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:40,117 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:31:40,118 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.017*\"israel\" + 0.016*\"vol\" + 0.015*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"european\" + 0.010*\"isra\" + 0.009*\"austria\"\n", + "2019-01-31 01:31:40,120 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.015*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:31:40,121 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"christian\" + 0.023*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:31:40,122 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"mean\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + 
"2019-01-31 01:31:40,128 : INFO : topic diff=0.003414, rho=0.021354\n", + "2019-01-31 01:31:40,287 : INFO : PROGRESS: pass 0, at document #4388000/4922894\n", + "2019-01-31 01:31:41,845 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:42,114 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.023*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.013*\"militari\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:31:42,115 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.033*\"sovereignti\" + 0.033*\"rural\" + 0.026*\"reprint\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.016*\"tyrant\" + 0.015*\"czech\"\n", + "2019-01-31 01:31:42,116 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.015*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"vacant\" + 0.009*\"foam\"\n", + "2019-01-31 01:31:42,117 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.033*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:31:42,118 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"lizard\"\n", + "2019-01-31 01:31:42,124 : INFO : topic diff=0.003335, rho=0.021349\n", + "2019-01-31 01:31:42,282 : INFO : PROGRESS: pass 0, at document #4390000/4922894\n", + "2019-01-31 01:31:43,758 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:44,026 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.026*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 
0.013*\"report\"\n", + "2019-01-31 01:31:44,028 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"florida\" + 0.007*\"incom\" + 0.006*\"trap\"\n", + "2019-01-31 01:31:44,029 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 01:31:44,030 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.008*\"polaris\" + 0.007*\"judaism\"\n", + "2019-01-31 01:31:44,031 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"group\" + 0.009*\"commun\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:31:44,038 : INFO : topic diff=0.002902, rho=0.021344\n", + "2019-01-31 01:31:44,199 : INFO : PROGRESS: pass 0, at document #4392000/4922894\n", + "2019-01-31 01:31:45,610 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:45,876 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.029*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.014*\"wreath\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"wine\"\n", + "2019-01-31 01:31:45,877 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.018*\"buford\" + 0.015*\"histor\" + 0.011*\"constitut\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.010*\"silicon\" + 0.010*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:31:45,878 : INFO : topic #6 (0.020): 0.071*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + 
"2019-01-31 01:31:45,880 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.012*\"olympo\" + 0.012*\"jack\"\n", + "2019-01-31 01:31:45,881 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"method\"\n", + "2019-01-31 01:31:45,886 : INFO : topic diff=0.004120, rho=0.021339\n", + "2019-01-31 01:31:46,047 : INFO : PROGRESS: pass 0, at document #4394000/4922894\n", + "2019-01-31 01:31:47,440 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:47,706 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:31:47,707 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.015*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"brazil\" + 0.013*\"portugues\"\n", + "2019-01-31 01:31:47,708 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.024*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:31:47,709 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:31:47,710 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"seaport\" + 
0.013*\"report\"\n", + "2019-01-31 01:31:47,716 : INFO : topic diff=0.003345, rho=0.021335\n", + "2019-01-31 01:31:47,874 : INFO : PROGRESS: pass 0, at document #4396000/4922894\n", + "2019-01-31 01:31:49,240 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:49,506 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:31:49,507 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.010*\"francisco\"\n", + "2019-01-31 01:31:49,508 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:31:49,509 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"act\" + 0.018*\"start\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:31:49,511 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.015*\"stop\" + 0.015*\"swedish\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.013*\"damag\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.010*\"denmark\" + 0.010*\"turkish\"\n", + "2019-01-31 01:31:49,517 : INFO : topic diff=0.002557, rho=0.021330\n", + "2019-01-31 01:31:49,675 : INFO : PROGRESS: pass 0, at document #4398000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:31:51,057 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:51,324 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"pathwai\" + 
0.007*\"hormon\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:31:51,325 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:31:51,326 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:31:51,328 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.050*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.017*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:31:51,328 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:31:51,334 : INFO : topic diff=0.003255, rho=0.021325\n", + "2019-01-31 01:31:54,099 : INFO : -11.638 per-word bound, 3186.9 perplexity estimate based on a held-out corpus of 2000 documents with 582131 words\n", + "2019-01-31 01:31:54,100 : INFO : PROGRESS: pass 0, at document #4400000/4922894\n", + "2019-01-31 01:31:55,506 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:55,772 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"ret\" + 0.012*\"find\" + 0.012*\"driver\" + 0.011*\"fool\" + 0.010*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:31:55,774 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 
0.009*\"myspac\"\n", + "2019-01-31 01:31:55,775 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:31:55,776 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.024*\"christian\" + 0.023*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:31:55,777 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.031*\"jpg\" + 0.030*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.019*\"illicit\" + 0.016*\"artist\" + 0.016*\"gai\" + 0.016*\"exhaust\" + 0.016*\"colder\"\n", + "2019-01-31 01:31:55,783 : INFO : topic diff=0.003138, rho=0.021320\n", + "2019-01-31 01:31:55,940 : INFO : PROGRESS: pass 0, at document #4402000/4922894\n", + "2019-01-31 01:31:57,314 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:57,580 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" + 0.015*\"gener\" + 0.014*\"seri\"\n", + "2019-01-31 01:31:57,581 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"grammat\" + 0.015*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"brazil\" + 0.012*\"portugues\"\n", + "2019-01-31 01:31:57,582 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:31:57,583 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 
0.020*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:31:57,584 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"magazin\" + 0.011*\"nicola\"\n", + "2019-01-31 01:31:57,590 : INFO : topic diff=0.003187, rho=0.021315\n", + "2019-01-31 01:31:57,747 : INFO : PROGRESS: pass 0, at document #4404000/4922894\n", + "2019-01-31 01:31:59,323 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:31:59,589 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:31:59,590 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"poet\" + 0.007*\"gener\" + 0.007*\"servitud\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"method\"\n", + "2019-01-31 01:31:59,592 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.016*\"swedish\" + 0.016*\"stop\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.011*\"treeless\" + 0.010*\"denmark\" + 0.010*\"turkish\"\n", + "2019-01-31 01:31:59,593 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.011*\"word\" + 0.011*\"degre\" + 0.011*\"http\"\n", + "2019-01-31 01:31:59,594 : INFO : topic #21 (0.020): 0.034*\"samford\" + 0.023*\"spain\" + 0.017*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.013*\"santa\" + 0.011*\"carlo\" + 0.011*\"juan\" + 0.011*\"lizard\"\n", + "2019-01-31 01:31:59,599 : INFO : topic diff=0.003461, rho=0.021310\n", + "2019-01-31 01:31:59,757 : INFO : PROGRESS: pass 0, at document #4406000/4922894\n", + "2019-01-31 01:32:01,143 : INFO : merging 
changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:01,412 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.016*\"strategist\" + 0.014*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:32:01,413 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:32:01,414 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.011*\"affection\" + 0.011*\"televis\" + 0.011*\"anglo\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"singh\"\n", + "2019-01-31 01:32:01,415 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"mean\" + 0.009*\"form\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:32:01,416 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.043*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.019*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:32:01,422 : INFO : topic diff=0.003479, rho=0.021306\n", + "2019-01-31 01:32:01,580 : INFO : PROGRESS: pass 0, at document #4408000/4922894\n", + "2019-01-31 01:32:02,985 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:03,255 : INFO : topic #11 (0.020): 0.024*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:32:03,256 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"serv\" 
+ 0.015*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:32:03,257 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.071*\"januari\" + 0.069*\"juli\" + 0.068*\"august\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.067*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:32:03,258 : INFO : topic #36 (0.020): 0.010*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:32:03,259 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"million\" + 0.012*\"busi\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:32:03,265 : INFO : topic diff=0.003051, rho=0.021301\n", + "2019-01-31 01:32:03,423 : INFO : PROGRESS: pass 0, at document #4410000/4922894\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:32:04,821 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:05,089 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.014*\"scot\" + 0.014*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:32:05,090 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.039*\"line\" + 0.032*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:32:05,091 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.008*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"diggin\" + 0.007*\"includ\"\n", + "2019-01-31 01:32:05,092 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.049*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" 
+ 0.018*\"korean\" + 0.017*\"leah\" + 0.017*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:32:05,093 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:32:05,100 : INFO : topic diff=0.002522, rho=0.021296\n", + "2019-01-31 01:32:05,260 : INFO : PROGRESS: pass 0, at document #4412000/4922894\n", + "2019-01-31 01:32:06,650 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:06,917 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"israel\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.009*\"isra\" + 0.009*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:32:06,918 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.049*\"chilton\" + 0.024*\"kong\" + 0.024*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.017*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:32:06,919 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.025*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:32:06,920 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:32:06,921 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.010*\"man\" + 0.008*\"appear\" + 0.008*\"comic\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:32:06,927 : INFO : topic diff=0.003163, rho=0.021291\n", + "2019-01-31 01:32:07,152 : INFO : PROGRESS: pass 0, at document #4414000/4922894\n", + "2019-01-31 
01:32:08,574 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:08,840 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.013*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:32:08,841 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.028*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.014*\"warrior\" + 0.013*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:32:08,842 : INFO : topic #4 (0.020): 0.018*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.006*\"teratogen\" + 0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:32:08,843 : INFO : topic #31 (0.020): 0.049*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:32:08,844 : INFO : topic #9 (0.020): 0.072*\"bone\" + 0.042*\"american\" + 0.029*\"valour\" + 0.019*\"dutch\" + 0.019*\"player\" + 0.017*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:32:08,850 : INFO : topic diff=0.003536, rho=0.021286\n", + "2019-01-31 01:32:09,011 : INFO : PROGRESS: pass 0, at document #4416000/4922894\n", + "2019-01-31 01:32:10,390 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:10,660 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.031*\"jpg\" + 0.030*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"exhaust\" + 0.016*\"artist\" + 0.016*\"gai\" + 0.016*\"colder\"\n", + "2019-01-31 01:32:10,661 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 
0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:32:10,662 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.012*\"anim\" + 0.011*\"man\" + 0.008*\"appear\" + 0.007*\"comic\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:32:10,663 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:32:10,664 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.016*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.009*\"european\" + 0.009*\"isra\" + 0.009*\"austria\"\n", + "2019-01-31 01:32:10,670 : INFO : topic diff=0.003006, rho=0.021281\n", + "2019-01-31 01:32:10,831 : INFO : PROGRESS: pass 0, at document #4418000/4922894\n", + "2019-01-31 01:32:12,219 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:12,489 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.016*\"new\" + 0.016*\"hydrogen\" + 0.016*\"novotná\" + 0.015*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:32:12,490 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.016*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.010*\"isra\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:32:12,491 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.016*\"italian\" + 0.016*\"mexico\" + 0.014*\"santa\" + 0.014*\"soviet\" + 0.012*\"juan\" + 0.011*\"lizard\" + 0.011*\"carlo\"\n", + "2019-01-31 01:32:12,492 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.007*\"armi\" + 
0.007*\"empath\" + 0.007*\"till\" + 0.007*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:32:12,493 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:32:12,499 : INFO : topic diff=0.002996, rho=0.021277\n", + "2019-01-31 01:32:15,226 : INFO : -11.535 per-word bound, 2967.8 perplexity estimate based on a held-out corpus of 2000 documents with 568219 words\n", + "2019-01-31 01:32:15,226 : INFO : PROGRESS: pass 0, at document #4420000/4922894\n", + "2019-01-31 01:32:16,620 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:16,890 : INFO : topic #9 (0.020): 0.071*\"bone\" + 0.042*\"american\" + 0.028*\"valour\" + 0.019*\"dutch\" + 0.019*\"player\" + 0.018*\"folei\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:32:16,891 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.013*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:32:16,892 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:32:16,893 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"woman\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:32:16,894 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.016*\"swedish\" + 0.016*\"stop\" + 0.015*\"norwai\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.012*\"damag\" + 0.011*\"treeless\" + 0.010*\"turkish\" + 0.010*\"denmark\"\n", + "2019-01-31 01:32:16,900 : INFO : 
topic diff=0.002642, rho=0.021272\n", + "2019-01-31 01:32:17,063 : INFO : PROGRESS: pass 0, at document #4422000/4922894\n", + "2019-01-31 01:32:18,483 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:32:18,749 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:32:18,750 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:32:18,751 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.011*\"market\" + 0.011*\"produc\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:32:18,752 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.034*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.020*\"poland\" + 0.019*\"moscow\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:32:18,753 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.048*\"chilton\" + 0.024*\"kong\" + 0.023*\"hong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.017*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:32:18,759 : INFO : topic diff=0.003702, rho=0.021267\n", + "2019-01-31 01:32:18,915 : INFO : PROGRESS: pass 0, at document #4424000/4922894\n", + "2019-01-31 01:32:20,314 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:20,580 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 
0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:32:20,581 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.025*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:32:20,582 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.011*\"olympo\" + 0.011*\"jack\"\n", + "2019-01-31 01:32:20,583 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.016*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.010*\"isra\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:32:20,584 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:32:20,590 : INFO : topic diff=0.002791, rho=0.021262\n", + "2019-01-31 01:32:20,752 : INFO : PROGRESS: pass 0, at document #4426000/4922894\n", + "2019-01-31 01:32:22,164 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:22,430 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:32:22,432 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:32:22,433 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 
0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:32:22,434 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.039*\"line\" + 0.032*\"raid\" + 0.031*\"rivièr\" + 0.026*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:32:22,435 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.046*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.019*\"citi\"\n", + "2019-01-31 01:32:22,441 : INFO : topic diff=0.002783, rho=0.021257\n", + "2019-01-31 01:32:22,603 : INFO : PROGRESS: pass 0, at document #4428000/4922894\n", + "2019-01-31 01:32:24,014 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:24,281 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:32:24,282 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:32:24,283 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:32:24,285 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:32:24,286 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.011*\"televis\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 
0.010*\"alam\"\n", + "2019-01-31 01:32:24,292 : INFO : topic diff=0.003561, rho=0.021253\n", + "2019-01-31 01:32:24,449 : INFO : PROGRESS: pass 0, at document #4430000/4922894\n", + "2019-01-31 01:32:25,831 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:26,098 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.039*\"line\" + 0.032*\"raid\" + 0.031*\"rivièr\" + 0.026*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:32:26,099 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"order\"\n", + "2019-01-31 01:32:26,100 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"wreath\" + 0.011*\"piec\"\n", + "2019-01-31 01:32:26,101 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.035*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.023*\"personifi\" + 0.020*\"poland\" + 0.019*\"moscow\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:32:26,103 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"florida\" + 0.007*\"incom\"\n", + "2019-01-31 01:32:26,109 : INFO : topic diff=0.003078, rho=0.021248\n", + "2019-01-31 01:32:26,264 : INFO : PROGRESS: pass 0, at document #4432000/4922894\n", + "2019-01-31 01:32:27,626 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:27,893 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.019*\"idiosyncrat\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 
0.013*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"brazil\"\n", + "2019-01-31 01:32:27,894 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"florida\" + 0.007*\"incom\"\n", + "2019-01-31 01:32:27,895 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:32:27,896 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"minist\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.015*\"gener\" + 0.015*\"serv\" + 0.013*\"seri\"\n", + "2019-01-31 01:32:27,898 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.007*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:32:27,903 : INFO : topic diff=0.002767, rho=0.021243\n", + "2019-01-31 01:32:28,061 : INFO : PROGRESS: pass 0, at document #4434000/4922894\n", + "2019-01-31 01:32:29,436 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:29,702 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.011*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"uruguayan\" + 0.007*\"known\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:32:29,703 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.011*\"affection\" + 0.011*\"anglo\" + 0.011*\"muskoge\" + 0.011*\"televis\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:32:29,705 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 
0.016*\"israel\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.013*\"jewish\" + 0.010*\"isra\" + 0.010*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:32:29,706 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.016*\"stop\" + 0.015*\"swedish\" + 0.015*\"norwai\" + 0.015*\"wind\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.011*\"treeless\" + 0.011*\"turkish\" + 0.010*\"denmark\"\n", + "2019-01-31 01:32:29,707 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.025*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:32:29,713 : INFO : topic diff=0.003246, rho=0.021238\n", + "2019-01-31 01:32:29,868 : INFO : PROGRESS: pass 0, at document #4436000/4922894\n", + "2019-01-31 01:32:31,219 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:31,485 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:32:31,486 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"legal\" + 0.009*\"polaris\" + 0.007*\"justic\"\n", + "2019-01-31 01:32:31,488 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"edit\" + 0.014*\"presid\" + 0.012*\"worldwid\" + 0.011*\"author\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:32:31,489 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.022*\"candid\" + 0.019*\"taxpay\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"ret\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.010*\"champion\"\n", + "2019-01-31 01:32:31,490 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.041*\"struggl\" + 0.034*\"high\" + 
0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.009*\"district\" + 0.009*\"task\" + 0.009*\"class\"\n", + "2019-01-31 01:32:31,496 : INFO : topic diff=0.002800, rho=0.021233\n", + "2019-01-31 01:32:31,654 : INFO : PROGRESS: pass 0, at document #4438000/4922894\n", + "2019-01-31 01:32:33,035 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:33,302 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.033*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.017*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.011*\"olympo\" + 0.011*\"jack\"\n", + "2019-01-31 01:32:33,303 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"affection\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"alam\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:32:33,304 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:32:33,305 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:32:33,306 : INFO : topic #48 (0.020): 0.084*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.072*\"januari\" + 0.070*\"juli\" + 0.069*\"notion\" + 0.068*\"august\" + 0.068*\"april\" + 0.067*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:32:33,312 : INFO : topic diff=0.003157, rho=0.021229\n", + "2019-01-31 01:32:35,995 : INFO : -11.712 per-word bound, 3354.2 perplexity estimate based on a held-out corpus of 2000 documents with 556876 words\n", + "2019-01-31 01:32:35,995 : INFO : PROGRESS: pass 0, at document #4440000/4922894\n", + "2019-01-31 01:32:37,370 : INFO : merging changes 
from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:37,637 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.011*\"ret\" + 0.011*\"squatter\" + 0.011*\"fool\" + 0.010*\"champion\"\n", + "2019-01-31 01:32:37,638 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.025*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:32:37,640 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.020*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.011*\"wreath\"\n", + "2019-01-31 01:32:37,641 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:32:37,642 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.021*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:32:37,648 : INFO : topic diff=0.002234, rho=0.021224\n", + "2019-01-31 01:32:37,807 : INFO : PROGRESS: pass 0, at document #4442000/4922894\n", + "2019-01-31 01:32:39,195 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:39,461 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:32:39,462 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.072*\"januari\" + 0.070*\"juli\" + 0.070*\"notion\" + 0.069*\"august\" + 0.068*\"april\" + 
0.067*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:32:39,463 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.045*\"american\" + 0.027*\"valour\" + 0.019*\"player\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.017*\"polit\" + 0.017*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:32:39,465 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.025*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.011*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:32:39,466 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:32:39,472 : INFO : topic diff=0.003017, rho=0.021219\n", + "2019-01-31 01:32:39,627 : INFO : PROGRESS: pass 0, at document #4444000/4922894\n", + "2019-01-31 01:32:40,993 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:41,260 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"method\"\n", + "2019-01-31 01:32:41,261 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"florida\" + 0.007*\"incom\"\n", + "2019-01-31 01:32:41,263 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.017*\"intern\" + 0.014*\"winner\"\n", + "2019-01-31 01:32:41,264 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.006*\"teratogen\" + 
0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:32:41,265 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:32:41,271 : INFO : topic diff=0.003178, rho=0.021214\n", + "2019-01-31 01:32:41,483 : INFO : PROGRESS: pass 0, at document #4446000/4922894\n", + "2019-01-31 01:32:42,859 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:43,126 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.019*\"duke\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.013*\"kingdom\" + 0.012*\"portugues\" + 0.012*\"order\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:32:43,127 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.027*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.023*\"alic\" + 0.020*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:32:43,128 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:32:43,130 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:32:43,131 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:32:43,137 : INFO : topic diff=0.003520, rho=0.021209\n", + "2019-01-31 01:32:43,287 : INFO : PROGRESS: pass 0, at 
document #4448000/4922894\n", + "2019-01-31 01:32:44,621 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:44,887 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.006*\"teratogen\" + 0.006*\"turn\" + 0.006*\"develop\"\n", + "2019-01-31 01:32:44,888 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:32:44,889 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.024*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:32:44,890 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.048*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.016*\"leah\" + 0.015*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:32:44,892 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.035*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.020*\"poland\" + 0.019*\"moscow\" + 0.014*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:32:44,897 : INFO : topic diff=0.003505, rho=0.021205\n", + "2019-01-31 01:32:45,058 : INFO : PROGRESS: pass 0, at document #4450000/4922894\n", + "2019-01-31 01:32:46,444 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:46,709 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"isra\"\n", + "2019-01-31 01:32:46,710 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 
0.073*\"januari\" + 0.071*\"juli\" + 0.070*\"notion\" + 0.069*\"august\" + 0.068*\"april\" + 0.068*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:32:46,712 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:32:46,713 : INFO : topic #17 (0.020): 0.077*\"church\" + 0.025*\"christian\" + 0.023*\"cathol\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.017*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:32:46,714 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:32:46,720 : INFO : topic diff=0.003222, rho=0.021200\n", + "2019-01-31 01:32:46,879 : INFO : PROGRESS: pass 0, at document #4452000/4922894\n", + "2019-01-31 01:32:48,242 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:48,508 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.039*\"line\" + 0.032*\"raid\" + 0.032*\"rivièr\" + 0.026*\"rosenwald\" + 0.019*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:32:48,509 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"hot\"\n", + "2019-01-31 01:32:48,510 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.016*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"josé\"\n", + "2019-01-31 01:32:48,512 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 
0.020*\"armi\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:32:48,513 : INFO : topic #35 (0.020): 0.054*\"russia\" + 0.035*\"sovereignti\" + 0.032*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.021*\"poland\" + 0.019*\"moscow\" + 0.014*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:32:48,519 : INFO : topic diff=0.002718, rho=0.021195\n", + "2019-01-31 01:32:48,677 : INFO : PROGRESS: pass 0, at document #4454000/4922894\n", + "2019-01-31 01:32:50,054 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:50,321 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:32:50,322 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"london\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"ireland\" + 0.019*\"british\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:32:50,323 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.066*\"best\" + 0.035*\"yawn\" + 0.031*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.017*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:32:50,324 : INFO : topic #46 (0.020): 0.019*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"stop\" + 0.015*\"norwegian\" + 0.014*\"wind\" + 0.012*\"damag\" + 0.011*\"denmark\" + 0.011*\"turkish\" + 0.011*\"treeless\"\n", + "2019-01-31 01:32:50,325 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.047*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:32:50,331 : INFO : topic diff=0.003525, rho=0.021190\n", + "2019-01-31 
01:32:50,491 : INFO : PROGRESS: pass 0, at document #4456000/4922894\n", + "2019-01-31 01:32:51,867 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:52,133 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.031*\"jpg\" + 0.030*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.015*\"gai\"\n", + "2019-01-31 01:32:52,135 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:32:52,136 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.039*\"line\" + 0.032*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:32:52,137 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"author\" + 0.011*\"storag\" + 0.011*\"nicola\"\n", + "2019-01-31 01:32:52,138 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.047*\"canadian\" + 0.024*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:32:52,144 : INFO : topic diff=0.003538, rho=0.021186\n", + "2019-01-31 01:32:52,304 : INFO : PROGRESS: pass 0, at document #4458000/4922894\n", + "2019-01-31 01:32:53,679 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:53,945 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"minist\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.017*\"gener\" + 0.015*\"serv\" + 0.014*\"seri\"\n", + "2019-01-31 01:32:53,946 : INFO : topic #27 (0.020): 
0.075*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.012*\"tornado\" + 0.012*\"driver\" + 0.012*\"ret\" + 0.012*\"find\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"yawn\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:32:53,948 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:32:53,949 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.023*\"kong\" + 0.022*\"hong\" + 0.022*\"korea\" + 0.018*\"korean\" + 0.017*\"sourc\" + 0.016*\"leah\" + 0.015*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:32:53,950 : INFO : topic #48 (0.020): 0.085*\"march\" + 0.079*\"octob\" + 0.078*\"sens\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.069*\"notion\" + 0.069*\"april\" + 0.068*\"august\" + 0.068*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:32:53,956 : INFO : topic diff=0.003069, rho=0.021181\n", + "2019-01-31 01:32:56,584 : INFO : -11.398 per-word bound, 2699.5 perplexity estimate based on a held-out corpus of 2000 documents with 559111 words\n", + "2019-01-31 01:32:56,585 : INFO : PROGRESS: pass 0, at document #4460000/4922894\n", + "2019-01-31 01:32:57,928 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:58,195 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:32:58,196 : INFO : topic #14 (0.020): 0.025*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:32:58,197 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.018*\"factor\" + 
0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:32:58,199 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"land\" + 0.008*\"lobe\"\n", + "2019-01-31 01:32:58,200 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"ret\" + 0.011*\"fool\" + 0.011*\"squatter\" + 0.010*\"yawn\"\n", + "2019-01-31 01:32:58,206 : INFO : topic diff=0.003532, rho=0.021176\n", + "2019-01-31 01:32:58,357 : INFO : PROGRESS: pass 0, at document #4462000/4922894\n", + "2019-01-31 01:32:59,688 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:32:59,954 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.006*\"encyclopedia\" + 0.006*\"develop\" + 0.006*\"turn\"\n", + "2019-01-31 01:32:59,955 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:32:59,956 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.039*\"line\" + 0.031*\"raid\" + 0.031*\"rivièr\" + 0.025*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:32:59,958 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"anim\" + 0.011*\"septemb\" + 0.010*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:32:59,959 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 
0.009*\"battalion\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"till\" + 0.007*\"govern\" + 0.006*\"militari\"\n", + "2019-01-31 01:32:59,965 : INFO : topic diff=0.003904, rho=0.021171\n", + "2019-01-31 01:33:00,119 : INFO : PROGRESS: pass 0, at document #4464000/4922894\n", + "2019-01-31 01:33:01,463 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:01,729 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:33:01,730 : INFO : topic #48 (0.020): 0.083*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.071*\"januari\" + 0.070*\"notion\" + 0.070*\"juli\" + 0.067*\"august\" + 0.067*\"april\" + 0.066*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:33:01,732 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.025*\"christian\" + 0.023*\"cathol\" + 0.022*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:33:01,733 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:33:01,734 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:33:01,740 : INFO : topic diff=0.002838, rho=0.021167\n", + "2019-01-31 01:33:01,898 : INFO : PROGRESS: pass 0, at document #4466000/4922894\n", + "2019-01-31 01:33:03,272 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:03,538 : INFO : topic #35 (0.020): 0.055*\"russia\" + 
0.038*\"sovereignti\" + 0.032*\"rural\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.024*\"personifi\" + 0.020*\"poland\" + 0.019*\"moscow\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:33:03,539 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.014*\"center\" + 0.013*\"open\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"area\"\n", + "2019-01-31 01:33:03,540 : INFO : topic #48 (0.020): 0.083*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.071*\"januari\" + 0.070*\"juli\" + 0.070*\"notion\" + 0.067*\"april\" + 0.067*\"august\" + 0.067*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:33:03,542 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:33:03,543 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.032*\"priest\" + 0.019*\"idiosyncrat\" + 0.019*\"rotterdam\" + 0.019*\"duke\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 0.013*\"portugues\" + 0.013*\"kingdom\" + 0.012*\"count\"\n", + "2019-01-31 01:33:03,549 : INFO : topic diff=0.003055, rho=0.021162\n", + "2019-01-31 01:33:03,706 : INFO : PROGRESS: pass 0, at document #4468000/4922894\n", + "2019-01-31 01:33:05,085 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:05,351 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.022*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:33:05,353 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.028*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.014*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:33:05,354 : INFO : topic #20 (0.020): 
0.144*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:33:05,355 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.013*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 0.011*\"francisco\"\n", + "2019-01-31 01:33:05,356 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:33:05,362 : INFO : topic diff=0.003160, rho=0.021157\n", + "2019-01-31 01:33:05,518 : INFO : PROGRESS: pass 0, at document #4470000/4922894\n", + "2019-01-31 01:33:06,895 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:07,161 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.020*\"sail\" + 0.016*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:33:07,162 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.014*\"pour\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.008*\"mode\" + 0.006*\"develop\" + 0.006*\"encyclopedia\" + 0.006*\"teratogen\"\n", + "2019-01-31 01:33:07,164 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.015*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:33:07,165 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.024*\"alic\" + 0.024*\"men\" + 0.020*\"medal\" + 0.019*\"event\" + 0.018*\"taxpay\" + 
0.018*\"rainfal\"\n", + "2019-01-31 01:33:07,166 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:33:07,172 : INFO : topic diff=0.002901, rho=0.021152\n", + "2019-01-31 01:33:07,326 : INFO : PROGRESS: pass 0, at document #4472000/4922894\n", + "2019-01-31 01:33:08,682 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:08,949 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:33:08,950 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"serv\"\n", + "2019-01-31 01:33:08,951 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:33:08,952 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:33:08,954 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:33:08,960 : INFO : topic diff=0.003029, rho=0.021148\n", + "2019-01-31 01:33:09,111 : INFO : PROGRESS: pass 0, at document #4474000/4922894\n", + "2019-01-31 01:33:10,450 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:33:10,717 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.015*\"stop\" + 0.015*\"norwegian\" + 0.015*\"wind\" + 0.012*\"damag\" + 0.011*\"turkish\" + 0.011*\"denmark\" + 0.010*\"treeless\"\n", + "2019-01-31 01:33:10,718 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.070*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.067*\"judici\" + 0.066*\"august\" + 0.066*\"april\" + 0.065*\"decatur\"\n", + "2019-01-31 01:33:10,719 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.018*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:33:10,720 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:33:10,721 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.008*\"cytokin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:33:10,727 : INFO : topic diff=0.003180, rho=0.021143\n", + "2019-01-31 01:33:10,888 : INFO : PROGRESS: pass 0, at document #4476000/4922894\n", + "2019-01-31 01:33:12,265 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:12,531 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.068*\"best\" + 0.036*\"yawn\" + 0.031*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:33:12,532 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 
0.009*\"class\"\n", + "2019-01-31 01:33:12,533 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.024*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.016*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:33:12,535 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:33:12,536 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.040*\"line\" + 0.031*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.014*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:33:12,542 : INFO : topic diff=0.003230, rho=0.021138\n", + "2019-01-31 01:33:12,758 : INFO : PROGRESS: pass 0, at document #4478000/4922894\n", + "2019-01-31 01:33:14,173 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:14,439 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:33:14,440 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:33:14,441 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:33:14,442 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 
0.007*\"florida\"\n", + "2019-01-31 01:33:14,444 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.023*\"alic\" + 0.020*\"event\" + 0.020*\"medal\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:33:14,449 : INFO : topic diff=0.004110, rho=0.021134\n", + "2019-01-31 01:33:17,200 : INFO : -11.560 per-word bound, 3019.7 perplexity estimate based on a held-out corpus of 2000 documents with 586810 words\n", + "2019-01-31 01:33:17,200 : INFO : PROGRESS: pass 0, at document #4480000/4922894\n", + "2019-01-31 01:33:18,607 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:18,874 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:33:18,875 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"southern\" + 0.006*\"poet\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"field\"\n", + "2019-01-31 01:33:18,877 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.014*\"orchestr\" + 0.011*\"olympo\" + 0.011*\"jack\"\n", + "2019-01-31 01:33:18,878 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.024*\"minist\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"seri\"\n", + "2019-01-31 01:33:18,879 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:33:18,884 : INFO : topic diff=0.003466, rho=0.021129\n", + "2019-01-31 
01:33:19,046 : INFO : PROGRESS: pass 0, at document #4482000/4922894\n", + "2019-01-31 01:33:20,449 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:20,715 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"till\" + 0.006*\"militari\"\n", + "2019-01-31 01:33:20,717 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"lizard\" + 0.010*\"francisco\"\n", + "2019-01-31 01:33:20,718 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:33:20,719 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.025*\"london\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.019*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:33:20,720 : INFO : topic #27 (0.020): 0.077*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"yawn\" + 0.010*\"champion\"\n", + "2019-01-31 01:33:20,726 : INFO : topic diff=0.002771, rho=0.021124\n", + "2019-01-31 01:33:20,884 : INFO : PROGRESS: pass 0, at document #4484000/4922894\n", + "2019-01-31 01:33:22,267 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:22,534 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.007*\"rhyme\"\n", 
+ "2019-01-31 01:33:22,535 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.010*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:33:22,536 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:33:22,537 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.018*\"duke\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 01:33:22,538 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"selma\"\n", + "2019-01-31 01:33:22,544 : INFO : topic diff=0.003295, rho=0.021119\n", + "2019-01-31 01:33:22,702 : INFO : PROGRESS: pass 0, at document #4486000/4922894\n", + "2019-01-31 01:33:24,087 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:24,354 : INFO : topic #21 (0.020): 0.038*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.012*\"juan\" + 0.011*\"lizard\" + 0.010*\"francisco\"\n", + "2019-01-31 01:33:24,355 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.032*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.018*\"duke\" + 0.018*\"grammat\" + 0.016*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 01:33:24,356 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.068*\"best\" + 0.036*\"yawn\" + 0.031*\"jacksonvil\" + 0.023*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"festiv\" + 0.016*\"intern\" 
+ 0.014*\"prison\"\n", + "2019-01-31 01:33:24,357 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:33:24,358 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.023*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:33:24,364 : INFO : topic diff=0.003386, rho=0.021115\n", + "2019-01-31 01:33:24,523 : INFO : PROGRESS: pass 0, at document #4488000/4922894\n", + "2019-01-31 01:33:25,876 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:26,145 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:33:26,146 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.010*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:33:26,147 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.039*\"line\" + 0.032*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:33:26,149 : INFO : topic #17 (0.020): 0.078*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.018*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"parish\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:33:26,149 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"octob\" + 0.078*\"sens\" + 0.071*\"januari\" + 0.070*\"notion\" + 0.069*\"juli\" + 0.068*\"august\" + 0.067*\"april\" + 0.067*\"judici\" + 
0.066*\"decatur\"\n", + "2019-01-31 01:33:26,155 : INFO : topic diff=0.003947, rho=0.021110\n", + "2019-01-31 01:33:26,312 : INFO : PROGRESS: pass 0, at document #4490000/4922894\n", + "2019-01-31 01:33:27,678 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:27,944 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:33:27,946 : INFO : topic #27 (0.020): 0.077*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.013*\"ret\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.010*\"champion\" + 0.010*\"squatter\"\n", + "2019-01-31 01:33:27,947 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.050*\"chilton\" + 0.022*\"kong\" + 0.022*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"kim\" + 0.016*\"sourc\" + 0.013*\"shirin\"\n", + "2019-01-31 01:33:27,948 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:33:27,949 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:33:27,955 : INFO : topic diff=0.003029, rho=0.021105\n", + "2019-01-31 01:33:28,114 : INFO : PROGRESS: pass 0, at document #4492000/4922894\n", + "2019-01-31 01:33:29,517 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:29,784 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 
0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:33:29,785 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:33:29,786 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"workplac\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:33:29,787 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:33:29,788 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.009*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.008*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:33:29,794 : INFO : topic diff=0.003244, rho=0.021101\n", + "2019-01-31 01:33:29,953 : INFO : PROGRESS: pass 0, at document #4494000/4922894\n", + "2019-01-31 01:33:31,323 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:31,590 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.010*\"western\" + 0.009*\"genu\" + 0.009*\"biom\" + 0.008*\"median\" + 0.008*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:33:31,591 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:33:31,592 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 
0.009*\"reconstruct\"\n", + "2019-01-31 01:33:31,593 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:33:31,594 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:33:31,600 : INFO : topic diff=0.003030, rho=0.021096\n", + "2019-01-31 01:33:31,753 : INFO : PROGRESS: pass 0, at document #4496000/4922894\n", + "2019-01-31 01:33:33,112 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:33,380 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:33:33,381 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:33:33,382 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:33:33,383 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:33:33,384 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.026*\"new\" + 0.026*\"sourc\" + 
0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:33:33,390 : INFO : topic diff=0.003168, rho=0.021091\n", + "2019-01-31 01:33:33,552 : INFO : PROGRESS: pass 0, at document #4498000/4922894\n", + "2019-01-31 01:33:34,972 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:35,238 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:33:35,239 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:33:35,240 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.028*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:33:35,241 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.029*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:33:35,242 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.071*\"januari\" + 0.069*\"notion\" + 0.069*\"juli\" + 0.067*\"august\" + 0.067*\"april\" + 0.066*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:33:35,248 : INFO : topic diff=0.003618, rho=0.021087\n", + "2019-01-31 01:33:37,925 : INFO : -11.841 per-word bound, 3667.8 perplexity estimate based on a held-out corpus of 2000 documents with 535707 words\n", + "2019-01-31 01:33:37,926 : INFO : PROGRESS: pass 0, at document #4500000/4922894\n", + "2019-01-31 01:33:39,306 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:33:39,572 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.022*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:33:39,573 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:33:39,574 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:33:39,575 : INFO : topic #46 (0.020): 0.018*\"sweden\" + 0.017*\"norwai\" + 0.016*\"swedish\" + 0.016*\"norwegian\" + 0.016*\"stop\" + 0.014*\"wind\" + 0.011*\"damag\" + 0.011*\"turkish\" + 0.011*\"denmark\" + 0.010*\"farid\"\n", + "2019-01-31 01:33:39,576 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.008*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:33:39,582 : INFO : topic diff=0.003336, rho=0.021082\n", + "2019-01-31 01:33:39,744 : INFO : PROGRESS: pass 0, at document #4502000/4922894\n", + "2019-01-31 01:33:41,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:41,411 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.032*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.010*\"muskoge\" + 0.010*\"sri\" + 0.010*\"affection\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:33:41,412 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 
0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:33:41,413 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.014*\"selma\" + 0.013*\"bypass\"\n", + "2019-01-31 01:33:41,414 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.011*\"ret\" + 0.011*\"find\" + 0.010*\"champion\" + 0.010*\"squatter\"\n", + "2019-01-31 01:33:41,415 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"sack\" + 0.007*\"later\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:33:41,421 : INFO : topic diff=0.003045, rho=0.021077\n", + "2019-01-31 01:33:41,582 : INFO : PROGRESS: pass 0, at document #4504000/4922894\n", + "2019-01-31 01:33:42,980 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:43,247 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"sack\" + 0.007*\"later\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:33:43,248 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:33:43,249 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:33:43,250 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.040*\"struggl\" + 0.034*\"high\" + 0.029*\"educ\" + 0.025*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 
0.009*\"gothic\"\n", + "2019-01-31 01:33:43,251 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"driver\" + 0.011*\"find\" + 0.011*\"ret\" + 0.010*\"squatter\" + 0.010*\"champion\"\n", + "2019-01-31 01:33:43,257 : INFO : topic diff=0.003388, rho=0.021072\n", + "2019-01-31 01:33:43,418 : INFO : PROGRESS: pass 0, at document #4506000/4922894\n", + "2019-01-31 01:33:44,805 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:45,072 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.030*\"jpg\" + 0.030*\"fifteenth\" + 0.027*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.016*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.015*\"gai\"\n", + "2019-01-31 01:33:45,073 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"field\"\n", + "2019-01-31 01:33:45,074 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:33:45,075 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:33:45,076 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.006*\"govern\" + 0.006*\"pour\" + 0.006*\"militari\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:33:45,082 : INFO : topic diff=0.003315, rho=0.021068\n", + "2019-01-31 01:33:45,246 : INFO : PROGRESS: pass 0, at document 
#4508000/4922894\n", + "2019-01-31 01:33:46,671 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:46,937 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.035*\"publicis\" + 0.026*\"word\" + 0.020*\"new\" + 0.015*\"edit\" + 0.015*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:33:46,939 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:33:46,940 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:33:46,941 : INFO : topic #6 (0.020): 0.070*\"fewer\" + 0.024*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:33:46,942 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.020*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:33:46,948 : INFO : topic diff=0.005003, rho=0.021063\n", + "2019-01-31 01:33:47,107 : INFO : PROGRESS: pass 0, at document #4510000/4922894\n", + "2019-01-31 01:33:48,486 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:48,753 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:33:48,754 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.008*\"frontal\" + 0.007*\"southern\" + 0.006*\"poet\" + 0.006*\"gener\" + 
0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"field\"\n", + "2019-01-31 01:33:48,755 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 01:33:48,756 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:33:48,757 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.016*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:33:48,763 : INFO : topic diff=0.002978, rho=0.021058\n", + "2019-01-31 01:33:48,979 : INFO : PROGRESS: pass 0, at document #4512000/4922894\n", + "2019-01-31 01:33:50,344 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:50,610 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.031*\"perceptu\" + 0.019*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.017*\"physician\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"son\"\n", + "2019-01-31 01:33:50,611 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:33:50,612 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.032*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.017*\"duke\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 01:33:50,613 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 
0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:33:50,615 : INFO : topic #42 (0.020): 0.045*\"german\" + 0.031*\"germani\" + 0.017*\"vol\" + 0.016*\"israel\" + 0.015*\"der\" + 0.015*\"jewish\" + 0.013*\"berlin\" + 0.010*\"isra\" + 0.009*\"european\" + 0.009*\"austria\"\n", + "2019-01-31 01:33:50,620 : INFO : topic diff=0.003161, rho=0.021054\n", + "2019-01-31 01:33:50,776 : INFO : PROGRESS: pass 0, at document #4514000/4922894\n", + "2019-01-31 01:33:52,140 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:52,407 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.021*\"candid\" + 0.019*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.012*\"find\" + 0.012*\"driver\" + 0.011*\"ret\" + 0.010*\"champion\" + 0.010*\"horac\"\n", + "2019-01-31 01:33:52,408 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.047*\"canadian\" + 0.024*\"toronto\" + 0.022*\"ontario\" + 0.021*\"hoar\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:33:52,409 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:33:52,410 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.017*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:33:52,411 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:33:52,417 : INFO : topic diff=0.003314, rho=0.021049\n", + "2019-01-31 01:33:52,575 : INFO : PROGRESS: pass 0, at 
document #4516000/4922894\n", + "2019-01-31 01:33:53,961 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:54,228 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.013*\"prognosi\" + 0.010*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:33:54,229 : INFO : topic #34 (0.020): 0.065*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.028*\"unionist\" + 0.027*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:33:54,230 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 0.019*\"idiosyncrat\" + 0.018*\"duke\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"portugues\" + 0.013*\"kingdom\" + 0.012*\"princ\"\n", + "2019-01-31 01:33:54,231 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:33:54,232 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"personifi\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.019*\"moscow\" + 0.019*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:33:54,237 : INFO : topic diff=0.003146, rho=0.021044\n", + "2019-01-31 01:33:54,394 : INFO : PROGRESS: pass 0, at document #4518000/4922894\n", + "2019-01-31 01:33:55,762 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:33:56,029 : INFO : topic #39 (0.020): 0.061*\"canada\" + 0.047*\"canadian\" + 0.024*\"toronto\" + 0.022*\"ontario\" + 0.021*\"hoar\" + 0.016*\"hydrogen\" + 0.015*\"new\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:33:56,030 : INFO : topic #36 (0.020): 0.011*\"network\" + 
0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:33:56,031 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:33:56,032 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.008*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.006*\"govern\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 01:33:56,033 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.039*\"line\" + 0.032*\"raid\" + 0.031*\"rivièr\" + 0.025*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:33:56,039 : INFO : topic diff=0.002334, rho=0.021040\n", + "2019-01-31 01:33:59,719 : INFO : -11.583 per-word bound, 3068.0 perplexity estimate based on a held-out corpus of 2000 documents with 562568 words\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:33:59,720 : INFO : PROGRESS: pass 0, at document #4520000/4922894\n", + "2019-01-31 01:34:01,117 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:01,383 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.016*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:34:01,385 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.018*\"leah\" + 0.018*\"korean\" + 0.016*\"sourc\" + 0.015*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:34:01,386 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.019*\"rotterdam\" + 
0.019*\"idiosyncrat\" + 0.018*\"duke\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"portugues\" + 0.014*\"kingdom\" + 0.012*\"princ\"\n", + "2019-01-31 01:34:01,387 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:34:01,388 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"anim\" + 0.011*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:34:01,394 : INFO : topic diff=0.003146, rho=0.021035\n", + "2019-01-31 01:34:01,552 : INFO : PROGRESS: pass 0, at document #4522000/4922894\n", + "2019-01-31 01:34:02,926 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:03,193 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.040*\"shield\" + 0.017*\"narrat\" + 0.017*\"scot\" + 0.013*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:03,194 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.020*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.018*\"duke\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.014*\"portugues\" + 0.013*\"kingdom\" + 0.012*\"princ\"\n", + "2019-01-31 01:34:03,195 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.024*\"offic\" + 0.022*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"council\"\n", + "2019-01-31 01:34:03,197 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.030*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.015*\"colder\" + 0.015*\"gai\"\n", + "2019-01-31 01:34:03,198 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" 
+ 0.024*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.011*\"piec\" + 0.008*\"wine\"\n", + "2019-01-31 01:34:03,204 : INFO : topic diff=0.003080, rho=0.021031\n", + "2019-01-31 01:34:03,361 : INFO : PROGRESS: pass 0, at document #4524000/4922894\n", + "2019-01-31 01:34:04,739 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:05,006 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:34:05,007 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.030*\"perceptu\" + 0.019*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"physician\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.012*\"olympo\" + 0.012*\"son\"\n", + "2019-01-31 01:34:05,009 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.020*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"unionist\" + 0.014*\"oper\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:34:05,010 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.017*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.015*\"norwegian\" + 0.013*\"wind\" + 0.013*\"treeless\" + 0.013*\"damag\" + 0.011*\"turkish\" + 0.010*\"denmark\"\n", + "2019-01-31 01:34:05,011 : INFO : topic #20 (0.020): 0.145*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.009*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:34:05,018 : INFO : topic diff=0.003270, rho=0.021026\n", + "2019-01-31 01:34:05,178 : INFO : PROGRESS: pass 0, at document #4526000/4922894\n", + "2019-01-31 01:34:06,572 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:06,838 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.032*\"incumb\" + 
0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"affection\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:34:06,839 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.013*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:34:06,841 : INFO : topic #42 (0.020): 0.046*\"german\" + 0.031*\"germani\" + 0.017*\"vol\" + 0.015*\"berlin\" + 0.015*\"israel\" + 0.015*\"jewish\" + 0.015*\"der\" + 0.009*\"austria\" + 0.009*\"isra\" + 0.009*\"european\"\n", + "2019-01-31 01:34:06,842 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"measur\"\n", + "2019-01-31 01:34:06,843 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.017*\"scot\" + 0.013*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:06,849 : INFO : topic diff=0.003658, rho=0.021021\n", + "2019-01-31 01:34:07,008 : INFO : PROGRESS: pass 0, at document #4528000/4922894\n", + "2019-01-31 01:34:08,390 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:08,657 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.021*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:34:08,658 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.016*\"margin\" + 0.016*\"yawn\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:34:08,659 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 
0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:34:08,660 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:34:08,662 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:34:08,667 : INFO : topic diff=0.002950, rho=0.021017\n", + "2019-01-31 01:34:08,827 : INFO : PROGRESS: pass 0, at document #4530000/4922894\n", + "2019-01-31 01:34:10,222 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:10,489 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:34:10,490 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:34:10,491 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.072*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.067*\"april\" + 0.066*\"august\" + 0.066*\"decatur\" + 0.065*\"judici\"\n", + "2019-01-31 01:34:10,492 : INFO : topic #4 (0.020): 0.021*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.008*\"elabor\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:34:10,494 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.024*\"minist\" + 0.024*\"nation\" + 0.024*\"offic\" + 
0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:34:10,499 : INFO : topic diff=0.003394, rho=0.021012\n", + "2019-01-31 01:34:10,658 : INFO : PROGRESS: pass 0, at document #4532000/4922894\n", + "2019-01-31 01:34:12,061 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:12,327 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:34:12,328 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:34:12,329 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.012*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:34:12,331 : INFO : topic #45 (0.020): 0.045*\"arsen\" + 0.030*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.015*\"exhaust\" + 0.015*\"colder\" + 0.015*\"gai\"\n", + "2019-01-31 01:34:12,332 : INFO : topic #36 (0.020): 0.010*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"user\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:34:12,338 : INFO : topic diff=0.003423, rho=0.021007\n", + "2019-01-31 01:34:12,496 : INFO : PROGRESS: pass 0, at document #4534000/4922894\n", + "2019-01-31 01:34:13,891 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:14,157 : 
INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:34:14,159 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:34:14,160 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.026*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:34:14,161 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:34:14,162 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.017*\"scot\" + 0.013*\"nativist\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:14,168 : INFO : topic diff=0.003446, rho=0.021003\n", + "2019-01-31 01:34:14,320 : INFO : PROGRESS: pass 0, at document #4536000/4922894\n", + "2019-01-31 01:34:15,669 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:15,936 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.067*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.017*\"festiv\" + 0.016*\"intern\" + 0.014*\"prison\"\n", + "2019-01-31 01:34:15,937 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.017*\"scot\" + 0.013*\"nativist\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:15,938 : INFO : topic #25 (0.020): 0.031*\"ring\" 
+ 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"foam\"\n", + "2019-01-31 01:34:15,939 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:34:15,940 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:34:15,946 : INFO : topic diff=0.003079, rho=0.020998\n", + "2019-01-31 01:34:16,102 : INFO : PROGRESS: pass 0, at document #4538000/4922894\n", + "2019-01-31 01:34:17,470 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:17,737 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"personifi\" + 0.025*\"reprint\" + 0.024*\"poison\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:34:17,738 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.013*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:34:17,739 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.023*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:34:17,740 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.016*\"republ\" + 0.014*\"selma\" + 0.014*\"report\" + 0.014*\"bypass\"\n", + "2019-01-31 01:34:17,741 : INFO : topic #22 (0.020): 0.033*\"spars\" + 
0.018*\"factor\" + 0.011*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:34:17,747 : INFO : topic diff=0.003340, rho=0.020993\n", + "2019-01-31 01:34:20,452 : INFO : -11.600 per-word bound, 3103.9 perplexity estimate based on a held-out corpus of 2000 documents with 563320 words\n", + "2019-01-31 01:34:20,453 : INFO : PROGRESS: pass 0, at document #4540000/4922894\n", + "2019-01-31 01:34:21,832 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:22,099 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.021*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:34:22,100 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:34:22,101 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:34:22,102 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.017*\"scot\" + 0.013*\"nativist\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:22,104 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:34:22,110 : INFO : topic diff=0.003248, rho=0.020989\n", + "2019-01-31 01:34:22,323 : INFO : PROGRESS: pass 0, at document #4542000/4922894\n", + 
"2019-01-31 01:34:23,690 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:23,956 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:34:23,957 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"berlin\" + 0.015*\"der\" + 0.014*\"israel\" + 0.009*\"austria\" + 0.009*\"european\" + 0.009*\"isra\"\n", + "2019-01-31 01:34:23,959 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"selma\" + 0.014*\"report\" + 0.014*\"bypass\"\n", + "2019-01-31 01:34:23,960 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"alic\" + 0.020*\"medal\" + 0.020*\"event\" + 0.019*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:34:23,961 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:34:23,967 : INFO : topic diff=0.003207, rho=0.020984\n", + "2019-01-31 01:34:24,123 : INFO : PROGRESS: pass 0, at document #4544000/4922894\n", + "2019-01-31 01:34:25,498 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:25,765 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.016*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"lobe\" + 0.008*\"palmer\"\n", + "2019-01-31 01:34:25,766 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 
0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"paul\" + 0.007*\"rhyme\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:34:25,767 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:34:25,768 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.069*\"notion\" + 0.068*\"juli\" + 0.067*\"april\" + 0.067*\"august\" + 0.066*\"decatur\" + 0.065*\"judici\"\n", + "2019-01-31 01:34:25,769 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.024*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:34:25,775 : INFO : topic diff=0.003201, rho=0.020980\n", + "2019-01-31 01:34:25,930 : INFO : PROGRESS: pass 0, at document #4546000/4922894\n", + "2019-01-31 01:34:27,301 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:27,567 : INFO : topic #36 (0.020): 0.011*\"prognosi\" + 0.010*\"network\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"diggin\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:34:27,568 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"find\" + 0.011*\"ret\" + 0.010*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:34:27,570 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:34:27,571 : INFO : topic #3 (0.020): 0.034*\"present\" + 
0.024*\"offic\" + 0.024*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"seri\"\n", + "2019-01-31 01:34:27,572 : INFO : topic #40 (0.020): 0.088*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:34:27,578 : INFO : topic diff=0.003255, rho=0.020975\n", + "2019-01-31 01:34:27,739 : INFO : PROGRESS: pass 0, at document #4548000/4922894\n", + "2019-01-31 01:34:29,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:29,410 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.016*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.013*\"treeless\" + 0.012*\"damag\" + 0.010*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:34:29,411 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"théori\" + 0.006*\"measur\"\n", + "2019-01-31 01:34:29,412 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:34:29,413 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.020*\"armi\" + 0.020*\"aggress\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.014*\"unionist\" + 0.012*\"militari\" + 0.012*\"diversifi\" + 0.012*\"airbu\"\n", + "2019-01-31 01:34:29,414 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.017*\"scot\" + 0.013*\"nativist\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:29,420 : INFO : topic diff=0.003421, rho=0.020970\n", + 
"2019-01-31 01:34:29,583 : INFO : PROGRESS: pass 0, at document #4550000/4922894\n", + "2019-01-31 01:34:30,991 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:31,258 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.018*\"strategist\" + 0.014*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:34:31,259 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.013*\"pakistan\" + 0.012*\"televis\" + 0.011*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:34:31,260 : INFO : topic #22 (0.020): 0.032*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:34:31,261 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.013*\"wind\" + 0.012*\"treeless\" + 0.012*\"damag\" + 0.010*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:34:31,262 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:34:31,268 : INFO : topic diff=0.003661, rho=0.020966\n", + "2019-01-31 01:34:31,429 : INFO : PROGRESS: pass 0, at document #4552000/4922894\n", + "2019-01-31 01:34:32,847 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:33,114 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"govern\" + 0.006*\"pour\" + 0.006*\"militari\"\n", + "2019-01-31 01:34:33,115 : INFO : topic #11 (0.020): 
0.023*\"john\" + 0.012*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:34:33,116 : INFO : topic #43 (0.020): 0.064*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"selma\" + 0.014*\"bypass\"\n", + "2019-01-31 01:34:33,117 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.022*\"bishop\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.010*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:34:33,118 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.030*\"perceptu\" + 0.019*\"compos\" + 0.019*\"theater\" + 0.017*\"place\" + 0.015*\"physician\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"son\"\n", + "2019-01-31 01:34:33,124 : INFO : topic diff=0.003049, rho=0.020961\n", + "2019-01-31 01:34:33,284 : INFO : PROGRESS: pass 0, at document #4554000/4922894\n", + "2019-01-31 01:34:34,680 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:34,947 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:34:34,948 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:34:34,949 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:34:34,950 : INFO : 
topic #35 (0.020): 0.056*\"russia\" + 0.039*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.024*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:34:34,951 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"user\" + 0.008*\"uruguayan\" + 0.007*\"includ\"\n", + "2019-01-31 01:34:34,957 : INFO : topic diff=0.003596, rho=0.020956\n", + "2019-01-31 01:34:35,107 : INFO : PROGRESS: pass 0, at document #4556000/4922894\n", + "2019-01-31 01:34:36,430 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:36,696 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.009*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:34:36,697 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.030*\"perceptu\" + 0.019*\"theater\" + 0.019*\"compos\" + 0.017*\"place\" + 0.015*\"physician\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"son\"\n", + "2019-01-31 01:34:36,698 : INFO : topic #45 (0.020): 0.046*\"arsen\" + 0.030*\"jpg\" + 0.029*\"fifteenth\" + 0.029*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.015*\"gai\" + 0.015*\"colder\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:34:36,699 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"woman\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:34:36,700 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.041*\"line\" + 0.032*\"rivièr\" + 0.030*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" 
+ 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:34:36,706 : INFO : topic diff=0.003217, rho=0.020952\n", + "2019-01-31 01:34:36,866 : INFO : PROGRESS: pass 0, at document #4558000/4922894\n", + "2019-01-31 01:34:38,242 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:38,508 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"woman\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:34:38,510 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:34:38,511 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.076*\"sens\" + 0.075*\"octob\" + 0.070*\"januari\" + 0.067*\"april\" + 0.066*\"notion\" + 0.066*\"august\" + 0.066*\"juli\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 01:34:38,511 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:34:38,513 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.047*\"american\" + 0.027*\"valour\" + 0.018*\"player\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:34:38,519 : INFO : topic diff=0.003054, rho=0.020947\n", + "2019-01-31 01:34:41,191 : INFO : -11.745 per-word bound, 3432.3 perplexity estimate based on a held-out corpus of 2000 documents with 548948 words\n", + "2019-01-31 01:34:41,191 : INFO : PROGRESS: pass 0, at document #4560000/4922894\n", + "2019-01-31 01:34:42,556 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:42,822 : INFO : topic #22 
(0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.007*\"florida\"\n", + "2019-01-31 01:34:42,823 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.039*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"personifi\" + 0.025*\"poison\" + 0.025*\"reprint\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:34:42,824 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"http\" + 0.011*\"degre\"\n", + "2019-01-31 01:34:42,825 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.022*\"bishop\" + 0.022*\"cathol\" + 0.017*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"poll\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:34:42,827 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.009*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:34:42,832 : INFO : topic diff=0.003177, rho=0.020943\n", + "2019-01-31 01:34:42,988 : INFO : PROGRESS: pass 0, at document #4562000/4922894\n", + "2019-01-31 01:34:44,357 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:44,623 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"woman\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:34:44,624 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.025*\"personifi\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 
01:34:44,625 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:34:44,627 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:34:44,628 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.016*\"scot\" + 0.012*\"nativist\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.009*\"class\"\n", + "2019-01-31 01:34:44,633 : INFO : topic diff=0.003266, rho=0.020938\n", + "2019-01-31 01:34:44,790 : INFO : PROGRESS: pass 0, at document #4564000/4922894\n", + "2019-01-31 01:34:46,175 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:46,442 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.020*\"armi\" + 0.020*\"aggress\" + 0.020*\"walter\" + 0.018*\"com\" + 0.015*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.012*\"diversifi\"\n", + "2019-01-31 01:34:46,443 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"battalion\" + 0.009*\"forc\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"govern\" + 0.006*\"teufel\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:34:46,444 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"norwai\" + 0.015*\"swedish\" + 0.014*\"norwegian\" + 0.014*\"damag\" + 0.013*\"wind\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:34:46,445 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.043*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.011*\"piec\" + 0.011*\"loui\" + 0.009*\"wine\"\n", + "2019-01-31 01:34:46,446 : INFO 
: topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"method\" + 0.006*\"exampl\" + 0.006*\"utopian\" + 0.006*\"measur\"\n", + "2019-01-31 01:34:46,452 : INFO : topic diff=0.003177, rho=0.020934\n", + "2019-01-31 01:34:46,616 : INFO : PROGRESS: pass 0, at document #4566000/4922894\n", + "2019-01-31 01:34:48,031 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:48,298 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.006*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"kenworthi\"\n", + "2019-01-31 01:34:48,299 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.025*\"woman\" + 0.024*\"men\" + 0.024*\"olymp\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:34:48,300 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.043*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.021*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.011*\"loui\" + 0.009*\"wine\"\n", + "2019-01-31 01:34:48,301 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"selma\" + 0.014*\"bypass\"\n", + "2019-01-31 01:34:48,301 : INFO : topic #30 (0.020): 0.036*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:34:48,307 : INFO : topic diff=0.004027, rho=0.020929\n", + "2019-01-31 01:34:48,467 : INFO : PROGRESS: pass 0, at document #4568000/4922894\n", + "2019-01-31 01:34:49,856 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:50,122 : 
INFO : topic #3 (0.020): 0.034*\"present\" + 0.025*\"offic\" + 0.025*\"nation\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:34:50,123 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.019*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:34:50,125 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"anglo\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:34:50,126 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.016*\"scot\" + 0.012*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:34:50,127 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.028*\"museo\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.015*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:34:50,133 : INFO : topic diff=0.003309, rho=0.020924\n", + "2019-01-31 01:34:50,290 : INFO : PROGRESS: pass 0, at document #4570000/4922894\n", + "2019-01-31 01:34:51,668 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:51,935 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.025*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 01:34:51,936 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 
0.012*\"north\"\n", + "2019-01-31 01:34:51,937 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.016*\"scot\" + 0.012*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:51,938 : INFO : topic #49 (0.020): 0.041*\"india\" + 0.031*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.010*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"affection\" + 0.010*\"sri\"\n", + "2019-01-31 01:34:51,939 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.024*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:34:51,944 : INFO : topic diff=0.003055, rho=0.020920\n", + "2019-01-31 01:34:52,103 : INFO : PROGRESS: pass 0, at document #4572000/4922894\n", + "2019-01-31 01:34:53,499 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:53,765 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"ret\" + 0.011*\"find\" + 0.010*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:34:53,766 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.016*\"scot\" + 0.012*\"pope\" + 0.012*\"nativist\" + 0.012*\"blur\" + 0.010*\"coalit\" + 0.009*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:34:53,767 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.016*\"jewish\" + 0.015*\"israel\" + 0.015*\"berlin\" + 0.014*\"der\" + 0.010*\"isra\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:34:53,768 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + 
"2019-01-31 01:34:53,769 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.009*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:34:53,775 : INFO : topic diff=0.004102, rho=0.020915\n", + "2019-01-31 01:34:53,986 : INFO : PROGRESS: pass 0, at document #4574000/4922894\n", + "2019-01-31 01:34:55,374 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:55,640 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.048*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.020*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.012*\"shirin\"\n", + "2019-01-31 01:34:55,641 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:34:55,642 : INFO : topic #0 (0.020): 0.063*\"statewid\" + 0.041*\"line\" + 0.032*\"rivièr\" + 0.030*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.010*\"transient\"\n", + "2019-01-31 01:34:55,643 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:34:55,644 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.026*\"poison\" + 0.025*\"reprint\" + 0.025*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:34:55,649 : INFO : topic diff=0.002974, rho=0.020911\n", + "2019-01-31 01:34:55,805 : INFO : PROGRESS: pass 0, at document #4576000/4922894\n", + "2019-01-31 01:34:57,181 : INFO : merging changes from 2000 documents into a model of 4922894 
documents\n", + "2019-01-31 01:34:57,447 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"palmer\"\n", + "2019-01-31 01:34:57,448 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.034*\"rural\" + 0.025*\"reprint\" + 0.025*\"poison\" + 0.025*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"unfortun\" + 0.015*\"tyrant\"\n", + "2019-01-31 01:34:57,449 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.016*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:34:57,450 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:34:57,451 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.056*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.014*\"selma\"\n", + "2019-01-31 01:34:57,457 : INFO : topic diff=0.003470, rho=0.020906\n", + "2019-01-31 01:34:57,614 : INFO : PROGRESS: pass 0, at document #4578000/4922894\n", + "2019-01-31 01:34:58,984 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:34:59,251 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.018*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.008*\"lobe\" + 0.008*\"palmer\"\n", + "2019-01-31 01:34:59,252 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.016*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"lizard\" + 
0.010*\"francisco\"\n", + "2019-01-31 01:34:59,253 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.012*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:34:59,254 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.014*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.011*\"silicon\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:34:59,254 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.033*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:34:59,260 : INFO : topic diff=0.003281, rho=0.020901\n", + "2019-01-31 01:35:01,933 : INFO : -11.547 per-word bound, 2992.5 perplexity estimate based on a held-out corpus of 2000 documents with 547904 words\n", + "2019-01-31 01:35:01,933 : INFO : PROGRESS: pass 0, at document #4580000/4922894\n", + "2019-01-31 01:35:03,305 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:03,572 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:35:03,573 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:35:03,574 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.032*\"priest\" + 0.021*\"rotterdam\" + 0.018*\"duke\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.013*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 01:35:03,575 : INFO : topic #24 (0.020): 
0.040*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.015*\"edit\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\" + 0.011*\"storag\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:35:03,576 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:35:03,582 : INFO : topic diff=0.002793, rho=0.020897\n", + "2019-01-31 01:35:03,741 : INFO : PROGRESS: pass 0, at document #4582000/4922894\n", + "2019-01-31 01:35:05,120 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:05,386 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.008*\"median\" + 0.008*\"biom\" + 0.008*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:35:05,387 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.031*\"jpg\" + 0.029*\"museo\" + 0.029*\"fifteenth\" + 0.021*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:35:05,388 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"utopian\" + 0.006*\"southern\"\n", + "2019-01-31 01:35:05,389 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:35:05,390 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.070*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.014*\"prison\"\n", + 
"2019-01-31 01:35:05,396 : INFO : topic diff=0.003381, rho=0.020892\n", + "2019-01-31 01:35:05,555 : INFO : PROGRESS: pass 0, at document #4584000/4922894\n", + "2019-01-31 01:35:06,947 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:07,213 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:35:07,214 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"method\" + 0.006*\"utopian\" + 0.006*\"southern\"\n", + "2019-01-31 01:35:07,215 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:35:07,216 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"proper\" + 0.007*\"caus\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:35:07,218 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:35:07,223 : INFO : topic diff=0.003149, rho=0.020888\n", + "2019-01-31 01:35:07,379 : INFO : PROGRESS: pass 0, at document #4586000/4922894\n", + "2019-01-31 01:35:08,751 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:09,019 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.016*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.012*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.010*\"class\"\n", + 
"2019-01-31 01:35:09,020 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.019*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:35:09,021 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:35:09,022 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:35:09,023 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.017*\"mexico\" + 0.017*\"del\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"francisco\"\n", + "2019-01-31 01:35:09,028 : INFO : topic diff=0.003194, rho=0.020883\n", + "2019-01-31 01:35:09,187 : INFO : PROGRESS: pass 0, at document #4588000/4922894\n", + "2019-01-31 01:35:10,564 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:10,830 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:35:10,831 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.043*\"franc\" + 0.031*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.012*\"loui\" + 0.009*\"wine\"\n", + "2019-01-31 01:35:10,833 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.019*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.011*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:35:10,834 : INFO 
: topic #20 (0.020): 0.145*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:35:10,835 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:35:10,840 : INFO : topic diff=0.002834, rho=0.020879\n", + "2019-01-31 01:35:10,998 : INFO : PROGRESS: pass 0, at document #4590000/4922894\n", + "2019-01-31 01:35:12,397 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:12,663 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.077*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.069*\"april\" + 0.069*\"juli\" + 0.068*\"august\" + 0.068*\"notion\" + 0.066*\"decatur\" + 0.066*\"judici\"\n", + "2019-01-31 01:35:12,664 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:35:12,665 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:35:12,666 : INFO : topic #23 (0.020): 0.136*\"audit\" + 0.069*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.015*\"prison\"\n", + "2019-01-31 01:35:12,667 : INFO : topic #4 (0.020): 0.020*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"uruguayan\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.007*\"veget\" + 0.007*\"turn\" + 0.006*\"teratogen\" + 0.006*\"stanc\"\n", + "2019-01-31 01:35:12,673 : INFO : 
topic diff=0.002706, rho=0.020874\n", + "2019-01-31 01:35:12,831 : INFO : PROGRESS: pass 0, at document #4592000/4922894\n", + "2019-01-31 01:35:14,204 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:14,470 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:35:14,471 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:35:14,472 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.023*\"toronto\" + 0.023*\"hoar\" + 0.023*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"novotná\" + 0.015*\"new\" + 0.014*\"misericordia\" + 0.013*\"quebec\"\n", + "2019-01-31 01:35:14,473 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"woman\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:35:14,474 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:35:14,480 : INFO : topic diff=0.003560, rho=0.020870\n", + "2019-01-31 01:35:14,636 : INFO : PROGRESS: pass 0, at document #4594000/4922894\n", + "2019-01-31 01:35:15,990 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:16,256 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.017*\"mexico\" + 0.017*\"del\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 
0.011*\"juan\" + 0.010*\"lizard\" + 0.010*\"francisco\"\n", + "2019-01-31 01:35:16,257 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.019*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:35:16,258 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.031*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.014*\"physician\" + 0.013*\"olympo\" + 0.013*\"orchestr\" + 0.011*\"son\"\n", + "2019-01-31 01:35:16,259 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:35:16,261 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.019*\"candid\" + 0.018*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"ret\" + 0.011*\"find\" + 0.010*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 01:35:16,266 : INFO : topic diff=0.003182, rho=0.020865\n", + "2019-01-31 01:35:16,420 : INFO : PROGRESS: pass 0, at document #4596000/4922894\n", + "2019-01-31 01:35:17,766 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:18,032 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"selma\" + 0.014*\"bypass\" + 0.014*\"report\"\n", + "2019-01-31 01:35:18,033 : INFO : topic #1 (0.020): 0.057*\"china\" + 0.049*\"chilton\" + 0.023*\"kong\" + 0.023*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:35:18,034 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"piec\" + 
0.012*\"loui\" + 0.010*\"wreath\"\n", + "2019-01-31 01:35:18,035 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:35:18,036 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.017*\"mexico\" + 0.017*\"del\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:35:18,042 : INFO : topic diff=0.003279, rho=0.020861\n", + "2019-01-31 01:35:18,208 : INFO : PROGRESS: pass 0, at document #4598000/4922894\n", + "2019-01-31 01:35:19,622 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:19,888 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.046*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:35:19,889 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"jame\" + 0.011*\"will\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:35:19,890 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:35:19,891 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.027*\"cotton\" + 0.022*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"north\" + 0.012*\"terri\"\n", + "2019-01-31 01:35:19,892 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 
0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:35:19,898 : INFO : topic diff=0.003189, rho=0.020856\n", + "2019-01-31 01:35:22,686 : INFO : -11.689 per-word bound, 3302.6 perplexity estimate based on a held-out corpus of 2000 documents with 598140 words\n", + "2019-01-31 01:35:22,687 : INFO : PROGRESS: pass 0, at document #4600000/4922894\n", + "2019-01-31 01:35:24,102 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:24,369 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.031*\"museo\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:35:24,370 : INFO : topic #28 (0.020): 0.035*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.011*\"silicon\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:35:24,371 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.008*\"lobe\"\n", + "2019-01-31 01:35:24,372 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.069*\"april\" + 0.069*\"juli\" + 0.069*\"august\" + 0.068*\"notion\" + 0.066*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:35:24,373 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"rainfal\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:35:24,379 : INFO : topic diff=0.003067, rho=0.020851\n", + "2019-01-31 01:35:24,537 : INFO : PROGRESS: pass 0, at document #4602000/4922894\n", + "2019-01-31 01:35:25,897 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:26,163 : 
INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"ret\" + 0.010*\"landslid\" + 0.010*\"squatter\"\n", + "2019-01-31 01:35:26,164 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.046*\"american\" + 0.026*\"valour\" + 0.020*\"folei\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:35:26,165 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:35:26,166 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.069*\"juli\" + 0.069*\"august\" + 0.069*\"april\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:35:26,167 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.022*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:35:26,173 : INFO : topic diff=0.003019, rho=0.020847\n", + "2019-01-31 01:35:26,327 : INFO : PROGRESS: pass 0, at document #4604000/4922894\n", + "2019-01-31 01:35:27,697 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:27,963 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.077*\"octob\" + 0.071*\"januari\" + 0.070*\"juli\" + 0.069*\"august\" + 0.069*\"april\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:35:27,964 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.016*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.012*\"winner\"\n", + "2019-01-31 01:35:27,966 : INFO : 
topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:35:27,967 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"selma\" + 0.014*\"bypass\" + 0.014*\"report\"\n", + "2019-01-31 01:35:27,968 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.015*\"israel\" + 0.015*\"berlin\" + 0.014*\"der\" + 0.009*\"isra\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:35:27,973 : INFO : topic diff=0.002804, rho=0.020842\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:35:28,132 : INFO : PROGRESS: pass 0, at document #4606000/4922894\n", + "2019-01-31 01:35:29,514 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:29,780 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:35:29,781 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:35:29,782 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:35:29,783 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.010*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 
0.007*\"uruguayan\"\n", + "2019-01-31 01:35:29,784 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.015*\"sweden\" + 0.015*\"swedish\" + 0.014*\"norwai\" + 0.014*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:35:29,790 : INFO : topic diff=0.002650, rho=0.020838\n", + "2019-01-31 01:35:30,005 : INFO : PROGRESS: pass 0, at document #4608000/4922894\n", + "2019-01-31 01:35:31,372 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:31,639 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"minist\" + 0.025*\"offic\" + 0.025*\"nation\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:35:31,640 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"upturn\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\"\n", + "2019-01-31 01:35:31,641 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"faster\" + 0.013*\"life\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:35:31,642 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.015*\"edit\" + 0.011*\"nicola\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 01:35:31,643 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"ret\" + 0.010*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:35:31,649 : INFO : topic diff=0.003006, rho=0.020833\n", + "2019-01-31 01:35:31,809 : INFO : PROGRESS: pass 0, at document #4610000/4922894\n", + "2019-01-31 01:35:33,211 : INFO : merging changes from 2000 documents into a 
model of 4922894 documents\n", + "2019-01-31 01:35:33,478 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.022*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:35:33,479 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"utopian\" + 0.006*\"method\" + 0.006*\"measur\"\n", + "2019-01-31 01:35:33,480 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.015*\"edit\" + 0.011*\"nicola\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"storag\"\n", + "2019-01-31 01:35:33,481 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.016*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.013*\"tiepolo\" + 0.012*\"women\"\n", + "2019-01-31 01:35:33,482 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.068*\"best\" + 0.036*\"yawn\" + 0.030*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:35:33,488 : INFO : topic diff=0.003296, rho=0.020829\n", + "2019-01-31 01:35:33,649 : INFO : PROGRESS: pass 0, at document #4612000/4922894\n", + "2019-01-31 01:35:35,041 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:35,308 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.011*\"loui\" + 0.010*\"wreath\"\n", + "2019-01-31 01:35:35,309 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 
0.014*\"prison\"\n", + "2019-01-31 01:35:35,310 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:35:35,311 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:35:35,312 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:35:35,318 : INFO : topic diff=0.003460, rho=0.020824\n", + "2019-01-31 01:35:35,475 : INFO : PROGRESS: pass 0, at document #4614000/4922894\n", + "2019-01-31 01:35:36,845 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:37,112 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:35:37,113 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.047*\"american\" + 0.026*\"valour\" + 0.019*\"folei\" + 0.019*\"dutch\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.012*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:35:37,114 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.040*\"line\" + 0.032*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:35:37,115 : INFO : topic #20 (0.020): 0.146*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 
0.010*\"task\"\n", + "2019-01-31 01:35:37,116 : INFO : topic #46 (0.020): 0.017*\"stop\" + 0.016*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.014*\"damag\" + 0.013*\"wind\" + 0.013*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:35:37,122 : INFO : topic diff=0.002780, rho=0.020820\n", + "2019-01-31 01:35:37,278 : INFO : PROGRESS: pass 0, at document #4616000/4922894\n", + "2019-01-31 01:35:38,655 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:38,921 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"depress\" + 0.011*\"linear\" + 0.011*\"centuri\" + 0.011*\"silicon\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:35:38,922 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.031*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.013*\"physician\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:35:38,923 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:35:38,925 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:35:38,925 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.034*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"area\" + 0.021*\"multitud\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:35:38,931 : INFO : topic diff=0.002501, rho=0.020815\n", + "2019-01-31 01:35:39,091 : INFO : PROGRESS: pass 0, at document #4618000/4922894\n", + "2019-01-31 01:35:40,492 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:35:40,759 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"teufel\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:35:40,760 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.031*\"museo\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:35:40,762 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.007*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:35:40,763 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.020*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:35:40,764 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"minist\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.016*\"gener\" + 0.015*\"serv\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:35:40,770 : INFO : topic diff=0.002865, rho=0.020811\n", + "2019-01-31 01:35:43,446 : INFO : -11.793 per-word bound, 3548.8 perplexity estimate based on a held-out corpus of 2000 documents with 539496 words\n", + "2019-01-31 01:35:43,446 : INFO : PROGRESS: pass 0, at document #4620000/4922894\n", + "2019-01-31 01:35:44,816 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:45,082 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 
0.011*\"degre\"\n", + "2019-01-31 01:35:45,084 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.039*\"line\" + 0.031*\"rivièr\" + 0.031*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:35:45,085 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"medal\" + 0.021*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:35:45,086 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.016*\"daphn\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.012*\"loui\" + 0.009*\"wine\"\n", + "2019-01-31 01:35:45,087 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"report\" + 0.014*\"bypass\" + 0.014*\"selma\"\n", + "2019-01-31 01:35:45,092 : INFO : topic diff=0.002813, rho=0.020806\n", + "2019-01-31 01:35:45,255 : INFO : PROGRESS: pass 0, at document #4622000/4922894\n", + "2019-01-31 01:35:46,673 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:46,939 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:35:46,940 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.015*\"jewish\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.009*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:35:46,941 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.069*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.025*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.014*\"prison\"\n", 
+ "2019-01-31 01:35:46,942 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:35:46,943 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.024*\"cathol\" + 0.024*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"poll\"\n", + "2019-01-31 01:35:46,949 : INFO : topic diff=0.003733, rho=0.020802\n", + "2019-01-31 01:35:47,108 : INFO : PROGRESS: pass 0, at document #4624000/4922894\n", + "2019-01-31 01:35:48,501 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:48,767 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:35:48,768 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"jame\" + 0.011*\"will\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:35:48,769 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:35:48,770 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:35:48,771 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.047*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.016*\"misericordia\" + 0.015*\"novotná\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 
0.014*\"quebec\"\n", + "2019-01-31 01:35:48,777 : INFO : topic diff=0.003301, rho=0.020797\n", + "2019-01-31 01:35:48,933 : INFO : PROGRESS: pass 0, at document #4626000/4922894\n", + "2019-01-31 01:35:50,301 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:50,568 : INFO : topic #48 (0.020): 0.082*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.072*\"januari\" + 0.069*\"juli\" + 0.069*\"april\" + 0.068*\"august\" + 0.068*\"notion\" + 0.067*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:35:50,569 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.013*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.007*\"judaism\"\n", + "2019-01-31 01:35:50,570 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.025*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:35:50,571 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.015*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:35:50,572 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:35:50,578 : INFO : topic diff=0.003136, rho=0.020793\n", + "2019-01-31 01:35:50,735 : INFO : PROGRESS: pass 0, at document #4628000/4922894\n", + "2019-01-31 01:35:52,108 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:52,374 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 
0.014*\"selma\" + 0.014*\"liber\"\n", + "2019-01-31 01:35:52,375 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.031*\"museo\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:35:52,376 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.048*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.023*\"ontario\" + 0.016*\"misericordia\" + 0.015*\"novotná\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"quebec\"\n", + "2019-01-31 01:35:52,377 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.031*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:35:52,378 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.012*\"nicola\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"author\"\n", + "2019-01-31 01:35:52,384 : INFO : topic diff=0.003417, rho=0.020788\n", + "2019-01-31 01:35:52,537 : INFO : PROGRESS: pass 0, at document #4630000/4922894\n", + "2019-01-31 01:35:53,894 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:35:54,160 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"alic\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:35:54,161 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.049*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.016*\"misericordia\" + 0.015*\"novotná\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"quebec\"\n", + "2019-01-31 01:35:54,162 : INFO : topic #23 (0.020): 0.137*\"audit\" + 0.069*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 
0.025*\"japanes\" + 0.022*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:35:54,163 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:35:54,164 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"militari\" + 0.006*\"teufel\" + 0.006*\"pour\"\n", + "2019-01-31 01:35:54,170 : INFO : topic diff=0.003429, rho=0.020784\n", + "2019-01-31 01:35:54,320 : INFO : PROGRESS: pass 0, at document #4632000/4922894\n", + "2019-01-31 01:35:56,120 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:56,386 : INFO : topic #30 (0.020): 0.034*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:35:56,388 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.011*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:35:56,389 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"jewish\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.009*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:35:56,390 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.009*\"sri\"\n", + "2019-01-31 01:35:56,391 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 
0.014*\"ret\" + 0.013*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.010*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:35:56,396 : INFO : topic diff=0.003634, rho=0.020779\n", + "2019-01-31 01:35:56,558 : INFO : PROGRESS: pass 0, at document #4634000/4922894\n", + "2019-01-31 01:35:58,045 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:35:58,312 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.011*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:35:58,313 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.013*\"driver\" + 0.013*\"tornado\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:35:58,314 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"upturn\" + 0.010*\"coalit\" + 0.010*\"fleet\"\n", + "2019-01-31 01:35:58,315 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:35:58,316 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.024*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:35:58,322 : INFO : topic diff=0.003200, rho=0.020775\n", + "2019-01-31 01:35:58,482 : INFO : PROGRESS: pass 0, at document #4636000/4922894\n", + "2019-01-31 01:35:59,864 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:00,130 : INFO : topic #38 (0.020): 0.023*\"walter\" + 0.009*\"aza\" + 
0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"teufel\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:36:00,132 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.021*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.019*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 01:36:00,133 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.048*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.015*\"leah\" + 0.014*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:36:00,134 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.028*\"champion\" + 0.026*\"woman\" + 0.025*\"men\" + 0.024*\"olymp\" + 0.022*\"alic\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"rainfal\"\n", + "2019-01-31 01:36:00,135 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.008*\"poll\"\n", + "2019-01-31 01:36:00,141 : INFO : topic diff=0.002718, rho=0.020770\n", + "2019-01-31 01:36:00,358 : INFO : PROGRESS: pass 0, at document #4638000/4922894\n", + "2019-01-31 01:36:01,746 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:02,013 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:36:02,014 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.040*\"line\" + 0.031*\"raid\" + 0.031*\"rivièr\" + 0.025*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:36:02,015 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"minist\" + 
0.026*\"nation\" + 0.025*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:36:02,016 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:36:02,017 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.009*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:36:02,023 : INFO : topic diff=0.003064, rho=0.020766\n", + "2019-01-31 01:36:04,662 : INFO : -11.738 per-word bound, 3415.9 perplexity estimate based on a held-out corpus of 2000 documents with 547135 words\n", + "2019-01-31 01:36:04,663 : INFO : PROGRESS: pass 0, at document #4640000/4922894\n", + "2019-01-31 01:36:06,023 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:06,289 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.024*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:36:06,291 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:36:06,292 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"workplac\"\n", + "2019-01-31 01:36:06,293 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.017*\"sweden\" + 0.016*\"swedish\" + 0.015*\"norwai\" + 0.014*\"damag\" + 0.013*\"wind\" 
+ 0.013*\"norwegian\" + 0.011*\"huntsvil\" + 0.011*\"treeless\" + 0.011*\"turkish\"\n", + "2019-01-31 01:36:06,294 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.026*\"rel\" + 0.025*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:36:06,300 : INFO : topic diff=0.003229, rho=0.020761\n", + "2019-01-31 01:36:06,459 : INFO : PROGRESS: pass 0, at document #4642000/4922894\n", + "2019-01-31 01:36:07,833 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:36:08,100 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.069*\"best\" + 0.036*\"yawn\" + 0.029*\"jacksonvil\" + 0.024*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:36:08,101 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"minist\" + 0.026*\"nation\" + 0.025*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:36:08,103 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:36:08,104 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.049*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.020*\"korea\" + 0.017*\"korean\" + 0.016*\"leah\" + 0.014*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:36:08,105 : INFO : topic #30 (0.020): 0.034*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:36:08,111 : INFO : topic diff=0.002943, rho=0.020757\n", + "2019-01-31 01:36:08,269 : 
INFO : PROGRESS: pass 0, at document #4644000/4922894\n", + "2019-01-31 01:36:09,659 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:09,925 : INFO : topic #20 (0.020): 0.144*\"scholar\" + 0.040*\"struggl\" + 0.033*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.018*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.009*\"task\"\n", + "2019-01-31 01:36:09,926 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:36:09,928 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.046*\"american\" + 0.028*\"valour\" + 0.020*\"folei\" + 0.019*\"dutch\" + 0.019*\"player\" + 0.017*\"english\" + 0.016*\"polit\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:36:09,929 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.014*\"leagu\" + 0.011*\"yawn\" + 0.011*\"folei\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:36:09,930 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:36:09,936 : INFO : topic diff=0.003041, rho=0.020752\n", + "2019-01-31 01:36:10,093 : INFO : PROGRESS: pass 0, at document #4646000/4922894\n", + "2019-01-31 01:36:11,450 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:11,716 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.048*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.014*\"new\" + 0.013*\"quebec\"\n", + "2019-01-31 01:36:11,717 : INFO : topic #3 (0.020): 
0.033*\"present\" + 0.026*\"minist\" + 0.026*\"nation\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:36:11,718 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.012*\"tornado\" + 0.012*\"fool\" + 0.011*\"squatter\" + 0.011*\"find\" + 0.010*\"horac\"\n", + "2019-01-31 01:36:11,720 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.076*\"sens\" + 0.075*\"octob\" + 0.071*\"januari\" + 0.068*\"juli\" + 0.068*\"notion\" + 0.068*\"april\" + 0.067*\"august\" + 0.065*\"judici\" + 0.064*\"decatur\"\n", + "2019-01-31 01:36:11,721 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.031*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.013*\"physician\" + 0.013*\"orchestr\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:36:11,727 : INFO : topic diff=0.003355, rho=0.020748\n", + "2019-01-31 01:36:11,881 : INFO : PROGRESS: pass 0, at document #4648000/4922894\n", + "2019-01-31 01:36:13,231 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:13,497 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:36:13,498 : INFO : topic #46 (0.020): 0.018*\"stop\" + 0.016*\"sweden\" + 0.015*\"swedish\" + 0.015*\"norwai\" + 0.014*\"damag\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:36:13,500 : INFO : topic #32 (0.020): 0.049*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.034*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.020*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:36:13,501 : INFO : topic #24 
(0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.014*\"edit\" + 0.012*\"nicola\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:36:13,502 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:36:13,508 : INFO : topic diff=0.002759, rho=0.020743\n", + "2019-01-31 01:36:13,675 : INFO : PROGRESS: pass 0, at document #4650000/4922894\n", + "2019-01-31 01:36:15,091 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:15,357 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.022*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.013*\"piec\" + 0.009*\"wine\"\n", + "2019-01-31 01:36:15,358 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.022*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"tiepolo\" + 0.014*\"chamber\" + 0.012*\"open\"\n", + "2019-01-31 01:36:15,360 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.049*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"novotná\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.013*\"quebec\"\n", + "2019-01-31 01:36:15,361 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.015*\"portugues\" + 0.014*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:36:15,362 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.014*\"depress\" + 0.014*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.007*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:36:15,368 : INFO : topic 
diff=0.004041, rho=0.020739\n", + "2019-01-31 01:36:15,528 : INFO : PROGRESS: pass 0, at document #4652000/4922894\n", + "2019-01-31 01:36:16,919 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:17,186 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"million\" + 0.012*\"busi\" + 0.012*\"produc\" + 0.011*\"market\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:36:17,187 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.021*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.015*\"portugues\" + 0.014*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:36:17,188 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.014*\"report\"\n", + "2019-01-31 01:36:17,189 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"southern\"\n", + "2019-01-31 01:36:17,190 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.076*\"sens\" + 0.074*\"octob\" + 0.070*\"januari\" + 0.068*\"juli\" + 0.067*\"april\" + 0.067*\"notion\" + 0.067*\"august\" + 0.065*\"judici\" + 0.063*\"decatur\"\n", + "2019-01-31 01:36:17,196 : INFO : topic diff=0.003276, rho=0.020735\n", + "2019-01-31 01:36:17,355 : INFO : PROGRESS: pass 0, at document #4654000/4922894\n", + "2019-01-31 01:36:18,719 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:18,985 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.048*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.015*\"novotná\" + 0.014*\"new\" + 0.013*\"quebec\"\n" + ] 
+ }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:36:18,987 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.009*\"comic\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:36:18,988 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.013*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:36:18,989 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:36:18,990 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.027*\"minist\" + 0.026*\"nation\" + 0.024*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:36:18,996 : INFO : topic diff=0.003550, rho=0.020730\n", + "2019-01-31 01:36:19,154 : INFO : PROGRESS: pass 0, at document #4656000/4922894\n", + "2019-01-31 01:36:20,531 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:20,797 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.009*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:36:20,798 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.049*\"chilton\" + 0.025*\"hong\" + 0.024*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.013*\"shirin\"\n", + "2019-01-31 01:36:20,799 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.014*\"edit\" + 0.012*\"nicola\" + 
0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:36:20,800 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"colder\" + 0.016*\"gai\"\n", + "2019-01-31 01:36:20,801 : INFO : topic #9 (0.020): 0.070*\"bone\" + 0.047*\"american\" + 0.029*\"valour\" + 0.020*\"folei\" + 0.020*\"dutch\" + 0.018*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.013*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:36:20,807 : INFO : topic diff=0.003081, rho=0.020726\n", + "2019-01-31 01:36:20,964 : INFO : PROGRESS: pass 0, at document #4658000/4922894\n", + "2019-01-31 01:36:22,329 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:22,595 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:36:22,596 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.040*\"line\" + 0.031*\"raid\" + 0.030*\"rivièr\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.010*\"briarwood\"\n", + "2019-01-31 01:36:22,597 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.025*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:36:22,598 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.012*\"militari\" + 0.011*\"refut\"\n", + "2019-01-31 01:36:22,599 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"tornado\" + 0.013*\"ret\" + 0.012*\"driver\" + 0.011*\"fool\" + 
0.011*\"squatter\" + 0.011*\"find\" + 0.010*\"horac\"\n", + "2019-01-31 01:36:22,605 : INFO : topic diff=0.002912, rho=0.020721\n", + "2019-01-31 01:36:25,307 : INFO : -11.554 per-word bound, 3005.8 perplexity estimate based on a held-out corpus of 2000 documents with 547383 words\n", + "2019-01-31 01:36:25,308 : INFO : PROGRESS: pass 0, at document #4660000/4922894\n", + "2019-01-31 01:36:26,687 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:26,953 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:36:26,954 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:36:26,955 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.030*\"jpg\" + 0.029*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.016*\"gai\"\n", + "2019-01-31 01:36:26,956 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:36:26,957 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:36:26,963 : INFO : topic diff=0.002779, rho=0.020717\n", + "2019-01-31 01:36:27,122 : INFO : PROGRESS: pass 0, at document #4662000/4922894\n", + "2019-01-31 01:36:28,494 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:28,761 : INFO 
: topic #35 (0.020): 0.059*\"russia\" + 0.036*\"sovereignti\" + 0.036*\"rural\" + 0.026*\"reprint\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:36:28,762 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.022*\"spain\" + 0.017*\"del\" + 0.017*\"italian\" + 0.016*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:36:28,762 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.013*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:36:28,764 : INFO : topic #49 (0.020): 0.042*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"pakistan\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.010*\"muskoge\" + 0.010*\"khalsa\" + 0.010*\"sri\"\n", + "2019-01-31 01:36:28,765 : INFO : topic #11 (0.020): 0.022*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\" + 0.007*\"georg\"\n", + "2019-01-31 01:36:28,770 : INFO : topic diff=0.002856, rho=0.020712\n", + "2019-01-31 01:36:28,931 : INFO : PROGRESS: pass 0, at document #4664000/4922894\n", + "2019-01-31 01:36:30,294 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:30,563 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.012*\"produc\" + 0.011*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:36:30,564 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:36:30,565 : INFO : topic #33 (0.020): 
0.061*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"loui\" + 0.013*\"lazi\" + 0.013*\"piec\" + 0.010*\"wine\"\n", + "2019-01-31 01:36:30,566 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.017*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:36:30,567 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.021*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"portugues\" + 0.013*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:36:30,573 : INFO : topic diff=0.002665, rho=0.020708\n", + "2019-01-31 01:36:30,730 : INFO : PROGRESS: pass 0, at document #4666000/4922894\n", + "2019-01-31 01:36:32,103 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:32,370 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:36:32,372 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.015*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:36:32,373 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:36:32,374 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"ret\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"find\" + 0.011*\"squatter\" + 
0.010*\"horac\"\n", + "2019-01-31 01:36:32,375 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.009*\"fleet\"\n", + "2019-01-31 01:36:32,381 : INFO : topic diff=0.003147, rho=0.020703\n", + "2019-01-31 01:36:32,536 : INFO : PROGRESS: pass 0, at document #4668000/4922894\n", + "2019-01-31 01:36:33,893 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:34,159 : INFO : topic #17 (0.020): 0.082*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.011*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:36:34,160 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"govern\" + 0.006*\"pour\" + 0.006*\"till\"\n", + "2019-01-31 01:36:34,161 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"selma\" + 0.013*\"report\"\n", + "2019-01-31 01:36:34,162 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.048*\"canadian\" + 0.025*\"toronto\" + 0.022*\"hoar\" + 0.022*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:36:34,163 : INFO : topic #41 (0.020): 0.041*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.011*\"includ\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:36:34,169 : INFO : topic diff=0.003079, rho=0.020699\n", + "2019-01-31 01:36:34,383 : INFO : PROGRESS: pass 0, at document #4670000/4922894\n", + "2019-01-31 01:36:35,785 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:36:36,051 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:36:36,052 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"lobe\" + 0.008*\"palmer\"\n", + "2019-01-31 01:36:36,053 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:36:36,054 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.040*\"line\" + 0.030*\"raid\" + 0.030*\"rivièr\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.011*\"briarwood\"\n", + "2019-01-31 01:36:36,055 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:36:36,062 : INFO : topic diff=0.002544, rho=0.020695\n", + "2019-01-31 01:36:36,215 : INFO : PROGRESS: pass 0, at document #4672000/4922894\n", + "2019-01-31 01:36:37,569 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:37,835 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.014*\"edit\" + 0.011*\"magazin\" + 0.011*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:36:37,836 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.031*\"jpg\" + 0.029*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"colder\" + 
0.016*\"exhaust\" + 0.016*\"gai\"\n", + "2019-01-31 01:36:37,837 : INFO : topic #7 (0.020): 0.022*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"daughter\" + 0.012*\"deal\"\n", + "2019-01-31 01:36:37,838 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.008*\"lobe\"\n", + "2019-01-31 01:36:37,839 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:36:37,845 : INFO : topic diff=0.002748, rho=0.020690\n", + "2019-01-31 01:36:38,004 : INFO : PROGRESS: pass 0, at document #4674000/4922894\n", + "2019-01-31 01:36:39,358 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:39,628 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:36:39,629 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\" + 0.007*\"georg\"\n", + "2019-01-31 01:36:39,630 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"loui\" + 0.013*\"lazi\" + 0.012*\"piec\" + 0.011*\"wine\"\n", + "2019-01-31 01:36:39,631 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 
01:36:39,632 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.047*\"canadian\" + 0.025*\"toronto\" + 0.022*\"hoar\" + 0.022*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:36:39,638 : INFO : topic diff=0.003452, rho=0.020686\n", + "2019-01-31 01:36:39,795 : INFO : PROGRESS: pass 0, at document #4676000/4922894\n", + "2019-01-31 01:36:41,180 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:41,446 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"martin\" + 0.015*\"taxpay\" + 0.014*\"chamber\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:36:41,447 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.036*\"sovereignti\" + 0.036*\"rural\" + 0.026*\"reprint\" + 0.025*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"unfortun\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:36:41,448 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.040*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.010*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:36:41,449 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:36:41,450 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"stop\" + 0.016*\"swedish\" + 0.016*\"norwai\" + 0.014*\"wind\" + 0.013*\"damag\" + 0.013*\"norwegian\" + 0.011*\"treeless\" + 0.010*\"turkish\" + 0.010*\"denmark\"\n", + "2019-01-31 01:36:41,456 : INFO : topic diff=0.003220, rho=0.020681\n", + "2019-01-31 01:36:41,616 : INFO : PROGRESS: pass 0, at document #4678000/4922894\n", + "2019-01-31 01:36:43,012 : INFO : merging changes from 2000 documents into 
a model of 4922894 documents\n", + "2019-01-31 01:36:43,279 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.032*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.016*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:36:43,280 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"southern\"\n", + "2019-01-31 01:36:43,281 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.013*\"physician\" + 0.013*\"orchestr\" + 0.012*\"olympo\" + 0.011*\"word\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:36:43,282 : INFO : topic #22 (0.020): 0.033*\"spars\" + 0.017*\"factor\" + 0.011*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:36:43,283 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:36:43,289 : INFO : topic diff=0.002784, rho=0.020677\n", + "2019-01-31 01:36:45,969 : INFO : -11.830 per-word bound, 3640.8 perplexity estimate based on a held-out corpus of 2000 documents with 564955 words\n", + "2019-01-31 01:36:45,969 : INFO : PROGRESS: pass 0, at document #4680000/4922894\n", + "2019-01-31 01:36:47,338 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:47,605 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 
0.007*\"rudolf\"\n", + "2019-01-31 01:36:47,606 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"israel\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:36:47,607 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.047*\"canadian\" + 0.025*\"toronto\" + 0.022*\"hoar\" + 0.022*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:36:47,608 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:36:47,609 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"million\" + 0.012*\"busi\" + 0.012*\"produc\" + 0.011*\"market\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:36:47,615 : INFO : topic diff=0.003103, rho=0.020672\n", + "2019-01-31 01:36:47,775 : INFO : PROGRESS: pass 0, at document #4682000/4922894\n", + "2019-01-31 01:36:49,161 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:49,427 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:36:49,428 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:36:49,429 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 
0.006*\"workplac\"\n", + "2019-01-31 01:36:49,430 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:36:49,431 : INFO : topic #0 (0.020): 0.062*\"statewid\" + 0.040*\"line\" + 0.030*\"raid\" + 0.030*\"rivièr\" + 0.026*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:36:49,438 : INFO : topic diff=0.002960, rho=0.020668\n", + "2019-01-31 01:36:49,591 : INFO : PROGRESS: pass 0, at document #4684000/4922894\n", + "2019-01-31 01:36:50,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:51,207 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:36:51,208 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"bypass\" + 0.014*\"republ\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:36:51,209 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.030*\"jpg\" + 0.029*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.016*\"gai\"\n", + "2019-01-31 01:36:51,210 : INFO : topic #17 (0.020): 0.082*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:36:51,211 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.047*\"canadian\" + 0.025*\"toronto\" + 0.022*\"hoar\" + 0.022*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 
0.014*\"new\" + 0.014*\"novotná\" + 0.014*\"quebec\"\n", + "2019-01-31 01:36:51,217 : INFO : topic diff=0.003033, rho=0.020664\n", + "2019-01-31 01:36:51,375 : INFO : PROGRESS: pass 0, at document #4686000/4922894\n", + "2019-01-31 01:36:52,754 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:53,020 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:36:53,021 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"mode\" + 0.006*\"measur\"\n", + "2019-01-31 01:36:53,022 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.011*\"linear\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:36:53,024 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.024*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:36:53,025 : INFO : topic #17 (0.020): 0.082*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.009*\"cathedr\" + 0.009*\"parish\"\n", + "2019-01-31 01:36:53,030 : INFO : topic diff=0.003063, rho=0.020659\n", + "2019-01-31 01:36:53,189 : INFO : PROGRESS: pass 0, at document #4688000/4922894\n", + "2019-01-31 01:36:54,597 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:54,864 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" 
+ 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:36:54,865 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.036*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"reprint\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"czech\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:36:54,866 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.030*\"jpg\" + 0.029*\"museo\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.022*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.016*\"gai\"\n", + "2019-01-31 01:36:54,867 : INFO : topic #20 (0.020): 0.143*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:36:54,868 : INFO : topic #3 (0.020): 0.034*\"present\" + 0.026*\"minist\" + 0.026*\"nation\" + 0.025*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:36:54,874 : INFO : topic diff=0.003146, rho=0.020655\n", + "2019-01-31 01:36:55,032 : INFO : PROGRESS: pass 0, at document #4690000/4922894\n", + "2019-01-31 01:36:56,394 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:56,662 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.022*\"candid\" + 0.017*\"taxpay\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"ret\" + 0.011*\"find\" + 0.011*\"squatter\" + 0.010*\"horac\"\n", + "2019-01-31 01:36:56,663 : INFO : topic #16 (0.020): 0.057*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.017*\"portugues\" + 0.017*\"quarterli\" + 0.013*\"kingdom\" + 0.013*\"brazil\"\n", + "2019-01-31 01:36:56,664 : INFO : topic #31 (0.020): 0.049*\"fusiform\" + 0.027*\"scientist\" + 0.026*\"taxpay\" + 
0.022*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.014*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:36:56,665 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.010*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:36:56,666 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"sourc\" + 0.026*\"london\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.015*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:36:56,672 : INFO : topic diff=0.003062, rho=0.020650\n", + "2019-01-31 01:36:56,827 : INFO : PROGRESS: pass 0, at document #4692000/4922894\n", + "2019-01-31 01:36:58,190 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:36:58,457 : INFO : topic #21 (0.020): 0.037*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:36:58,459 : INFO : topic #27 (0.020): 0.076*\"questionnair\" + 0.022*\"candid\" + 0.017*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.011*\"ret\" + 0.011*\"squatter\" + 0.011*\"find\" + 0.010*\"horac\"\n", + "2019-01-31 01:36:58,460 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.037*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"reprint\" + 0.026*\"poison\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"unfortun\" + 0.014*\"czech\"\n", + "2019-01-31 01:36:58,460 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.020*\"event\" + 0.020*\"alic\" + 0.018*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:36:58,462 : INFO 
: topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\" + 0.007*\"georg\"\n", + "2019-01-31 01:36:58,467 : INFO : topic diff=0.002836, rho=0.020646\n", + "2019-01-31 01:36:58,624 : INFO : PROGRESS: pass 0, at document #4694000/4922894\n", + "2019-01-31 01:36:59,987 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:00,254 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.015*\"misericordia\" + 0.015*\"hydrogen\" + 0.014*\"new\" + 0.014*\"novotná\" + 0.013*\"quebec\"\n", + "2019-01-31 01:37:00,255 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.022*\"cortic\" + 0.017*\"start\" + 0.017*\"act\" + 0.012*\"case\" + 0.012*\"ricardo\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.009*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:37:00,256 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"minist\" + 0.026*\"nation\" + 0.025*\"offic\" + 0.022*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:37:00,257 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:37:00,258 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:37:00,264 : INFO : topic diff=0.003665, rho=0.020642\n", + "2019-01-31 01:37:00,417 : INFO : PROGRESS: pass 0, at document #4696000/4922894\n", + "2019-01-31 01:37:01,766 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + 
"2019-01-31 01:37:02,032 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.071*\"januari\" + 0.071*\"juli\" + 0.069*\"april\" + 0.068*\"august\" + 0.068*\"notion\" + 0.068*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 01:37:02,034 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"mode\" + 0.006*\"measur\"\n", + "2019-01-31 01:37:02,035 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.040*\"line\" + 0.032*\"rivièr\" + 0.029*\"raid\" + 0.025*\"rosenwald\" + 0.022*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:37:02,036 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.023*\"alic\" + 0.022*\"medal\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:37:02,037 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:37:02,043 : INFO : topic diff=0.003034, rho=0.020637\n", + "2019-01-31 01:37:02,196 : INFO : PROGRESS: pass 0, at document #4698000/4922894\n", + "2019-01-31 01:37:03,541 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:03,807 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.007*\"veget\" + 0.006*\"produc\" + 0.006*\"turn\" + 0.006*\"encyclopedia\"\n", + "2019-01-31 01:37:03,808 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + 
"2019-01-31 01:37:03,810 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.016*\"histor\" + 0.011*\"linear\" + 0.011*\"depress\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:37:03,811 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.010*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"paul\" + 0.007*\"georg\"\n", + "2019-01-31 01:37:03,812 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"man\" + 0.011*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:37:03,818 : INFO : topic diff=0.003210, rho=0.020633\n", + "2019-01-31 01:37:06,495 : INFO : -11.710 per-word bound, 3349.6 perplexity estimate based on a held-out corpus of 2000 documents with 559991 words\n", + "2019-01-31 01:37:06,495 : INFO : PROGRESS: pass 0, at document #4700000/4922894\n", + "2019-01-31 01:37:07,862 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:08,128 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.011*\"anglo\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 0.010*\"muskoge\" + 0.010*\"sri\"\n", + "2019-01-31 01:37:08,129 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.039*\"line\" + 0.033*\"rivièr\" + 0.029*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:37:08,130 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.006*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:37:08,131 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"nation\" + 
0.026*\"minist\" + 0.025*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.017*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:37:08,132 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:37:08,138 : INFO : topic diff=0.002938, rho=0.020628\n", + "2019-01-31 01:37:08,296 : INFO : PROGRESS: pass 0, at document #4702000/4922894\n", + "2019-01-31 01:37:09,667 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:09,934 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.020*\"member\" + 0.017*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:37:09,936 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.010*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:37:09,937 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.020*\"bishop\" + 0.017*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:37:09,938 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.022*\"candid\" + 0.017*\"taxpay\" + 0.014*\"tornado\" + 0.012*\"driver\" + 0.012*\"squatter\" + 0.011*\"find\" + 0.011*\"fool\" + 0.011*\"ret\" + 0.010*\"horac\"\n", + "2019-01-31 01:37:09,939 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + 
"2019-01-31 01:37:09,945 : INFO : topic diff=0.003708, rho=0.020624\n", + "2019-01-31 01:37:10,160 : INFO : PROGRESS: pass 0, at document #4704000/4922894\n", + "2019-01-31 01:37:11,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:11,800 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.006*\"uruguayan\"\n", + "2019-01-31 01:37:11,801 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:37:11,803 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.014*\"edit\" + 0.012*\"magazin\" + 0.011*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:37:11,804 : INFO : topic #35 (0.020): 0.059*\"russia\" + 0.036*\"sovereignti\" + 0.035*\"rural\" + 0.026*\"poison\" + 0.026*\"reprint\" + 0.023*\"personifi\" + 0.020*\"moscow\" + 0.017*\"poland\" + 0.014*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:37:11,805 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.012*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:37:11,811 : INFO : topic diff=0.003334, rho=0.020620\n", + "2019-01-31 01:37:11,970 : INFO : PROGRESS: pass 0, at document #4706000/4922894\n", + "2019-01-31 01:37:13,352 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:13,618 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.022*\"hoar\" + 0.021*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"new\" 
+ 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:37:13,619 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.039*\"line\" + 0.033*\"rivièr\" + 0.029*\"raid\" + 0.025*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.018*\"traceabl\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:37:13,620 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.010*\"european\" + 0.009*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:37:13,621 : INFO : topic #40 (0.020): 0.085*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:37:13,622 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.036*\"publicis\" + 0.024*\"word\" + 0.020*\"new\" + 0.015*\"presid\" + 0.014*\"edit\" + 0.012*\"magazin\" + 0.011*\"nicola\" + 0.011*\"worldwid\" + 0.011*\"storag\"\n", + "2019-01-31 01:37:13,628 : INFO : topic diff=0.003315, rho=0.020615\n", + "2019-01-31 01:37:13,782 : INFO : PROGRESS: pass 0, at document #4708000/4922894\n", + "2019-01-31 01:37:15,149 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:15,416 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"task\" + 0.009*\"gothic\"\n", + "2019-01-31 01:37:15,417 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.010*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:37:15,418 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 
0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:37:15,419 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.029*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:37:15,420 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.016*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"lizard\"\n", + "2019-01-31 01:37:15,426 : INFO : topic diff=0.002818, rho=0.020611\n", + "2019-01-31 01:37:15,581 : INFO : PROGRESS: pass 0, at document #4710000/4922894\n", + "2019-01-31 01:37:16,943 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:17,209 : INFO : topic #35 (0.020): 0.061*\"russia\" + 0.037*\"rural\" + 0.037*\"sovereignti\" + 0.026*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.018*\"poland\" + 0.015*\"tyrant\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:37:17,211 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.014*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:37:17,212 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"mode\" + 0.006*\"measur\"\n", + "2019-01-31 01:37:17,213 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:37:17,214 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.032*\"cotton\" + 0.023*\"adulthood\" + 
0.022*\"multitud\" + 0.021*\"area\" + 0.020*\"commun\" + 0.020*\"cede\"\n", + "2019-01-31 01:37:17,220 : INFO : topic diff=0.002997, rho=0.020607\n", + "2019-01-31 01:37:17,379 : INFO : PROGRESS: pass 0, at document #4712000/4922894\n", + "2019-01-31 01:37:18,766 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:19,033 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.026*\"nation\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.023*\"govern\" + 0.021*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:37:19,034 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.075*\"octob\" + 0.075*\"sens\" + 0.073*\"januari\" + 0.070*\"juli\" + 0.069*\"april\" + 0.068*\"notion\" + 0.068*\"judici\" + 0.067*\"august\" + 0.067*\"decatur\"\n", + "2019-01-31 01:37:19,035 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.019*\"del\" + 0.017*\"mexico\" + 0.016*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"lizard\"\n", + "2019-01-31 01:37:19,036 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.007*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"user\"\n", + "2019-01-31 01:37:19,037 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.013*\"faster\" + 0.012*\"deal\" + 0.012*\"will\"\n", + "2019-01-31 01:37:19,043 : INFO : topic diff=0.003257, rho=0.020602\n", + "2019-01-31 01:37:19,205 : INFO : PROGRESS: pass 0, at document #4714000/4922894\n", + "2019-01-31 01:37:20,580 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:20,847 : INFO : topic #24 (0.020): 0.040*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 
0.012*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:37:20,849 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:37:20,850 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:37:20,851 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.007*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"user\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:37:20,852 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.008*\"elabor\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:37:20,858 : INFO : topic diff=0.003233, rho=0.020598\n", + "2019-01-31 01:37:21,020 : INFO : PROGRESS: pass 0, at document #4716000/4922894\n", + "2019-01-31 01:37:22,404 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:22,671 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.017*\"festiv\" + 0.015*\"prison\"\n", + "2019-01-31 01:37:22,672 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:37:22,672 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" 
+ 0.022*\"requir\" + 0.022*\"institut\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:37:22,674 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:37:22,675 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:37:22,680 : INFO : topic diff=0.002917, rho=0.020593\n", + "2019-01-31 01:37:22,837 : INFO : PROGRESS: pass 0, at document #4718000/4922894\n", + "2019-01-31 01:37:24,203 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:24,469 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"affection\" + 0.011*\"tajikistan\" + 0.010*\"televis\" + 0.010*\"muskoge\" + 0.010*\"khalsa\"\n", + "2019-01-31 01:37:24,471 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.014*\"oper\" + 0.013*\"unionist\" + 0.012*\"militari\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:37:24,472 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:37:24,473 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.017*\"portugues\" + 0.017*\"grammat\" + 0.016*\"quarterli\" + 0.014*\"kingdom\" + 0.014*\"brazil\"\n", + "2019-01-31 01:37:24,474 : INFO : topic #3 (0.020): 
0.032*\"present\" + 0.026*\"nation\" + 0.025*\"minist\" + 0.025*\"offic\" + 0.024*\"govern\" + 0.022*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:37:24,480 : INFO : topic diff=0.002491, rho=0.020589\n", + "2019-01-31 01:37:27,158 : INFO : -11.889 per-word bound, 3792.9 perplexity estimate based on a held-out corpus of 2000 documents with 552936 words\n", + "2019-01-31 01:37:27,159 : INFO : PROGRESS: pass 0, at document #4720000/4922894\n", + "2019-01-31 01:37:28,533 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:28,799 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"trace\"\n", + "2019-01-31 01:37:28,800 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.014*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:37:28,801 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 0.022*\"wreath\" + 0.021*\"sail\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:37:28,802 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.068*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 0.018*\"intern\" + 0.017*\"festiv\" + 0.015*\"prison\"\n", + "2019-01-31 01:37:28,804 : INFO : topic #18 (0.020): 0.010*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"end\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.004*\"help\" + 0.004*\"call\"\n", + "2019-01-31 01:37:28,809 : INFO : topic diff=0.002880, rho=0.020585\n", + "2019-01-31 01:37:28,967 : INFO : PROGRESS: pass 0, at document #4722000/4922894\n", + "2019-01-31 
01:37:30,334 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:30,601 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:37:30,602 : INFO : topic #1 (0.020): 0.054*\"china\" + 0.047*\"chilton\" + 0.028*\"kong\" + 0.027*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.015*\"leah\" + 0.015*\"sourc\" + 0.014*\"kim\" + 0.014*\"shirin\"\n", + "2019-01-31 01:37:30,603 : INFO : topic #31 (0.020): 0.049*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:37:30,604 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"southern\"\n", + "2019-01-31 01:37:30,605 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"mean\" + 0.009*\"origin\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:37:30,611 : INFO : topic diff=0.003509, rho=0.020580\n", + "2019-01-31 01:37:30,769 : INFO : PROGRESS: pass 0, at document #4724000/4922894\n", + "2019-01-31 01:37:32,164 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:32,431 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.011*\"septemb\" + 0.011*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:37:32,432 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 
0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"foam\"\n", + "2019-01-31 01:37:32,433 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:37:32,434 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.011*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:37:32,435 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.016*\"histor\" + 0.012*\"linear\" + 0.012*\"depress\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:37:32,441 : INFO : topic diff=0.003054, rho=0.020576\n", + "2019-01-31 01:37:32,595 : INFO : PROGRESS: pass 0, at document #4726000/4922894\n", + "2019-01-31 01:37:33,932 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:34,198 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"palmer\" + 0.009*\"foam\"\n", + "2019-01-31 01:37:34,200 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.011*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:37:34,201 : INFO : topic #13 (0.020): 0.028*\"australia\" + 0.027*\"london\" + 0.026*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.015*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:37:34,202 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 
0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:37:34,203 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.039*\"line\" + 0.033*\"rivièr\" + 0.029*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:37:34,208 : INFO : topic diff=0.002606, rho=0.020572\n", + "2019-01-31 01:37:34,360 : INFO : PROGRESS: pass 0, at document #4728000/4922894\n", + "2019-01-31 01:37:35,719 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:35,986 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.031*\"germani\" + 0.016*\"vol\" + 0.015*\"jewish\" + 0.014*\"israel\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:37:35,987 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.024*\"men\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.020*\"event\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 01:37:35,988 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"stop\" + 0.016*\"swedish\" + 0.016*\"norwai\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.013*\"damag\" + 0.010*\"turkish\" + 0.010*\"denmark\" + 0.010*\"farid\"\n", + "2019-01-31 01:37:35,989 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:37:35,990 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:37:35,996 : INFO : topic diff=0.003487, rho=0.020567\n", + "2019-01-31 01:37:36,152 
: INFO : PROGRESS: pass 0, at document #4730000/4922894\n", + "2019-01-31 01:37:37,519 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:37,785 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.023*\"hoar\" + 0.021*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"new\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:37:37,786 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"affection\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.011*\"tajikistan\" + 0.010*\"muskoge\"\n", + "2019-01-31 01:37:37,787 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.046*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.031*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.020*\"cede\" + 0.019*\"commun\"\n", + "2019-01-31 01:37:37,788 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"southern\"\n", + "2019-01-31 01:37:37,789 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.023*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:37:37,795 : INFO : topic diff=0.003071, rho=0.020563\n", + "2019-01-31 01:37:37,952 : INFO : PROGRESS: pass 0, at document #4732000/4922894\n", + "2019-01-31 01:37:39,314 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:39,580 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"colder\" + 0.016*\"gai\"\n", + "2019-01-31 01:37:39,582 : INFO : topic 
#15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:37:39,583 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"palmer\"\n", + "2019-01-31 01:37:39,584 : INFO : topic #33 (0.020): 0.061*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.022*\"jean\" + 0.021*\"sail\" + 0.020*\"wreath\" + 0.017*\"daphn\" + 0.013*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:37:39,585 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.007*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:37:39,591 : INFO : topic diff=0.002807, rho=0.020559\n", + "2019-01-31 01:37:39,801 : INFO : PROGRESS: pass 0, at document #4734000/4922894\n", + "2019-01-31 01:37:41,147 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:41,413 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.012*\"depress\" + 0.011*\"centuri\" + 0.011*\"constitut\" + 0.011*\"silicon\" + 0.010*\"pistol\"\n", + "2019-01-31 01:37:41,415 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:37:41,416 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:37:41,417 : INFO : topic #24 (0.020): 
0.040*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.012*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:37:41,418 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:37:41,424 : INFO : topic diff=0.003296, rho=0.020554\n", + "2019-01-31 01:37:41,574 : INFO : PROGRESS: pass 0, at document #4736000/4922894\n", + "2019-01-31 01:37:42,921 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:43,188 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.046*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.031*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.020*\"cede\" + 0.019*\"commun\"\n", + "2019-01-31 01:37:43,189 : INFO : topic #11 (0.020): 0.022*\"john\" + 0.011*\"will\" + 0.011*\"jame\" + 0.011*\"david\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"paul\" + 0.008*\"rhyme\" + 0.007*\"georg\"\n", + "2019-01-31 01:37:43,190 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.012*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"affection\" + 0.011*\"khalsa\" + 0.010*\"televis\" + 0.010*\"muskoge\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:37:43,191 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:37:43,192 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"itali\"\n", + "2019-01-31 01:37:43,198 : INFO : topic 
diff=0.002982, rho=0.020550\n", + "2019-01-31 01:37:43,351 : INFO : PROGRESS: pass 0, at document #4738000/4922894\n", + "2019-01-31 01:37:44,688 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:44,954 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.013*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:37:44,955 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.016*\"swedish\" + 0.016*\"stop\" + 0.016*\"norwai\" + 0.014*\"wind\" + 0.014*\"norwegian\" + 0.013*\"damag\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:37:44,956 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.046*\"chilton\" + 0.028*\"kong\" + 0.027*\"hong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.015*\"sourc\" + 0.014*\"leah\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:37:44,957 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.015*\"israel\" + 0.014*\"jewish\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.010*\"european\" + 0.010*\"europ\" + 0.009*\"austria\"\n", + "2019-01-31 01:37:44,958 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.024*\"democrat\" + 0.020*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"liber\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:37:44,964 : INFO : topic diff=0.003137, rho=0.020546\n", + "2019-01-31 01:37:47,630 : INFO : -11.389 per-word bound, 2682.5 perplexity estimate based on a held-out corpus of 2000 documents with 548437 words\n", + "2019-01-31 01:37:47,630 : INFO : PROGRESS: pass 0, at document #4740000/4922894\n", + "2019-01-31 01:37:48,996 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:49,263 : INFO : topic #10 
(0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.005*\"treat\"\n", + "2019-01-31 01:37:49,264 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.017*\"rainfal\"\n", + "2019-01-31 01:37:49,265 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"francisco\" + 0.011*\"juan\" + 0.010*\"itali\"\n", + "2019-01-31 01:37:49,266 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:37:49,267 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"physician\" + 0.013*\"olympo\" + 0.011*\"word\"\n", + "2019-01-31 01:37:49,273 : INFO : topic diff=0.002845, rho=0.020541\n", + "2019-01-31 01:37:49,437 : INFO : PROGRESS: pass 0, at document #4742000/4922894\n", + "2019-01-31 01:37:50,804 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:51,073 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.010*\"develop\" + 0.009*\"commun\" + 0.009*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:37:51,075 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.022*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:37:51,076 : INFO : topic #39 (0.020): 
0.060*\"canada\" + 0.047*\"canadian\" + 0.026*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"new\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:37:51,077 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"affection\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.010*\"televis\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:37:51,078 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"francisco\" + 0.010*\"itali\"\n", + "2019-01-31 01:37:51,083 : INFO : topic diff=0.003030, rho=0.020537\n", + "2019-01-31 01:37:51,236 : INFO : PROGRESS: pass 0, at document #4744000/4922894\n", + "2019-01-31 01:37:52,602 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:52,868 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 01:37:52,869 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.023*\"cathol\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.009*\"historiographi\" + 0.009*\"cathedr\"\n", + "2019-01-31 01:37:52,870 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.077*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.069*\"notion\" + 0.069*\"august\" + 0.068*\"april\" + 0.068*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:37:52,871 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.029*\"poison\" + 0.027*\"reprint\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"tyrant\" + 0.015*\"unfortun\"\n", + "2019-01-31 
01:37:52,872 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:37:52,878 : INFO : topic diff=0.003567, rho=0.020533\n", + "2019-01-31 01:37:53,033 : INFO : PROGRESS: pass 0, at document #4746000/4922894\n", + "2019-01-31 01:37:54,399 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:54,666 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"cathol\" + 0.023*\"christian\" + 0.020*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"parish\" + 0.010*\"historiographi\" + 0.009*\"poll\"\n", + "2019-01-31 01:37:54,667 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.045*\"popolo\" + 0.042*\"vigour\" + 0.034*\"tortur\" + 0.031*\"cotton\" + 0.023*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.020*\"cede\" + 0.019*\"commun\"\n", + "2019-01-31 01:37:54,668 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:37:54,669 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.044*\"american\" + 0.032*\"valour\" + 0.019*\"folei\" + 0.018*\"player\" + 0.018*\"dutch\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:37:54,670 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"alic\" + 0.019*\"event\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 01:37:54,676 : INFO : topic diff=0.002670, rho=0.020528\n", + "2019-01-31 01:37:54,836 : INFO : PROGRESS: pass 0, at document #4748000/4922894\n", + "2019-01-31 01:37:56,243 : INFO : merging changes from 2000 documents into a model 
of 4922894 documents\n", + "2019-01-31 01:37:56,510 : INFO : topic #48 (0.020): 0.081*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.070*\"notion\" + 0.069*\"august\" + 0.069*\"april\" + 0.068*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:37:56,511 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.009*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:37:56,513 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.022*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"yawn\" + 0.010*\"folei\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:37:56,514 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.028*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"terri\" + 0.013*\"warrior\" + 0.012*\"north\"\n", + "2019-01-31 01:37:56,515 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.034*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:37:56,521 : INFO : topic diff=0.003243, rho=0.020524\n", + "2019-01-31 01:37:56,680 : INFO : PROGRESS: pass 0, at document #4750000/4922894\n", + "2019-01-31 01:37:58,125 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:37:58,393 : INFO : topic #41 (0.020): 0.042*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.012*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:37:58,395 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.024*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 
0.010*\"task\"\n", + "2019-01-31 01:37:58,396 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.009*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.007*\"teufel\" + 0.007*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:37:58,397 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"http\"\n", + "2019-01-31 01:37:58,399 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:37:58,405 : INFO : topic diff=0.002864, rho=0.020520\n", + "2019-01-31 01:37:58,563 : INFO : PROGRESS: pass 0, at document #4752000/4922894\n", + "2019-01-31 01:37:59,945 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:00,212 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"daughter\"\n", + "2019-01-31 01:38:00,213 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.021*\"sail\" + 0.018*\"wreath\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:38:00,214 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.014*\"tornado\" + 0.013*\"driver\" + 0.012*\"squatter\" + 0.012*\"fool\" + 0.011*\"find\" + 0.010*\"horac\"\n", + "2019-01-31 01:38:00,215 : INFO : topic #23 (0.020): 0.139*\"audit\" + 0.069*\"best\" + 0.036*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.021*\"noll\" + 0.019*\"women\" + 
0.018*\"intern\" + 0.018*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:38:00,216 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"bahá\"\n", + "2019-01-31 01:38:00,222 : INFO : topic diff=0.002654, rho=0.020515\n", + "2019-01-31 01:38:00,375 : INFO : PROGRESS: pass 0, at document #4754000/4922894\n", + "2019-01-31 01:38:01,723 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:01,989 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.010*\"european\" + 0.010*\"europ\" + 0.010*\"austria\"\n", + "2019-01-31 01:38:01,990 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"swedish\" + 0.016*\"norwai\" + 0.016*\"stop\" + 0.014*\"wind\" + 0.013*\"norwegian\" + 0.012*\"damag\" + 0.012*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"denmark\"\n", + "2019-01-31 01:38:01,991 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:38:01,993 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.021*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.014*\"tornado\" + 0.013*\"driver\" + 0.012*\"squatter\" + 0.011*\"fool\" + 0.011*\"find\" + 0.010*\"horac\"\n", + "2019-01-31 01:38:01,994 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.024*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.011*\"movi\" + 0.010*\"direct\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:38:02,000 : INFO : topic diff=0.002949, rho=0.020511\n", + "2019-01-31 01:38:02,149 : INFO : PROGRESS: pass 0, at document #4756000/4922894\n", + "2019-01-31 01:38:03,500 : 
INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:03,767 : INFO : topic #25 (0.020): 0.033*\"ring\" + 0.019*\"area\" + 0.018*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"foam\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.008*\"palmer\"\n", + "2019-01-31 01:38:03,768 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.023*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"itali\" + 0.010*\"francisco\"\n", + "2019-01-31 01:38:03,769 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.013*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:38:03,770 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.038*\"sovereignti\" + 0.035*\"rural\" + 0.029*\"poison\" + 0.027*\"reprint\" + 0.024*\"personifi\" + 0.019*\"moscow\" + 0.019*\"poland\" + 0.015*\"tyrant\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:38:03,771 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:38:03,777 : INFO : topic diff=0.003260, rho=0.020507\n", + "2019-01-31 01:38:03,931 : INFO : PROGRESS: pass 0, at document #4758000/4922894\n", + "2019-01-31 01:38:05,291 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:05,558 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.039*\"line\" + 0.032*\"rivièr\" + 0.029*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.013*\"oper\" + 0.011*\"briarwood\"\n", + "2019-01-31 01:38:05,560 : INFO : topic #47 (0.020): 0.064*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.016*\"damn\" + 
0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:38:05,561 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:38:05,562 : INFO : topic #45 (0.020): 0.049*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:38:05,563 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:38:05,569 : INFO : topic diff=0.003050, rho=0.020502\n", + "2019-01-31 01:38:08,229 : INFO : -11.870 per-word bound, 3742.6 perplexity estimate based on a held-out corpus of 2000 documents with 532156 words\n", + "2019-01-31 01:38:08,229 : INFO : PROGRESS: pass 0, at document #4760000/4922894\n", + "2019-01-31 01:38:09,593 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:09,859 : INFO : topic #26 (0.020): 0.030*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 01:38:09,860 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.024*\"govern\" + 0.022*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.013*\"council\"\n", + "2019-01-31 01:38:09,861 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:38:09,862 
: INFO : topic #41 (0.020): 0.042*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.012*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:38:09,864 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.017*\"muscl\" + 0.016*\"simultan\" + 0.015*\"charcoal\" + 0.013*\"toyota\" + 0.009*\"myspac\"\n", + "2019-01-31 01:38:09,869 : INFO : topic diff=0.002848, rho=0.020498\n", + "2019-01-31 01:38:10,028 : INFO : PROGRESS: pass 0, at document #4762000/4922894\n", + "2019-01-31 01:38:11,415 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:11,684 : INFO : topic #4 (0.020): 0.018*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.008*\"elabor\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:38:11,685 : INFO : topic #1 (0.020): 0.056*\"china\" + 0.047*\"chilton\" + 0.027*\"kong\" + 0.026*\"hong\" + 0.022*\"korea\" + 0.020*\"korean\" + 0.017*\"sourc\" + 0.014*\"leah\" + 0.014*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:38:11,686 : INFO : topic #26 (0.020): 0.029*\"workplac\" + 0.029*\"champion\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.024*\"men\" + 0.022*\"medal\" + 0.019*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.017*\"atheist\"\n", + "2019-01-31 01:38:11,687 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:38:11,688 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.023*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.015*\"retroflex\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"parish\" + 0.009*\"poll\"\n", + "2019-01-31 01:38:11,694 : 
INFO : topic diff=0.003839, rho=0.020494\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:38:11,845 : INFO : PROGRESS: pass 0, at document #4764000/4922894\n", + "2019-01-31 01:38:13,173 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:13,439 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:38:13,441 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.013*\"center\" + 0.012*\"lobe\" + 0.011*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:38:13,442 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.018*\"champion\" + 0.015*\"chamber\" + 0.014*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:38:13,442 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:38:13,443 : INFO : topic #49 (0.020): 0.045*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.011*\"khalsa\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:38:13,449 : INFO : topic diff=0.003146, rho=0.020489\n", + "2019-01-31 01:38:13,663 : INFO : PROGRESS: pass 0, at document #4766000/4922894\n", + "2019-01-31 01:38:15,075 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:15,342 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 
0.007*\"uruguayan\" + 0.007*\"includ\" + 0.007*\"user\"\n", + "2019-01-31 01:38:15,344 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"workplac\" + 0.007*\"storag\" + 0.006*\"black\"\n", + "2019-01-31 01:38:15,344 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.016*\"wreath\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:38:15,345 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"southern\"\n", + "2019-01-31 01:38:15,346 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:38:15,353 : INFO : topic diff=0.002722, rho=0.020485\n", + "2019-01-31 01:38:15,509 : INFO : PROGRESS: pass 0, at document #4768000/4922894\n", + "2019-01-31 01:38:16,885 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:17,151 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"swedish\" + 0.016*\"stop\" + 0.015*\"norwai\" + 0.014*\"wind\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:38:17,152 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.014*\"new\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:38:17,153 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.039*\"line\" + 0.033*\"rivièr\" + 0.029*\"raid\" + 0.027*\"rosenwald\" + 0.020*\"airmen\" + 0.017*\"traceabl\" + 
0.017*\"serv\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:38:17,154 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:38:17,155 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.015*\"vol\" + 0.014*\"israel\" + 0.014*\"der\" + 0.014*\"berlin\" + 0.013*\"jewish\" + 0.010*\"austria\" + 0.010*\"european\" + 0.010*\"europ\"\n", + "2019-01-31 01:38:17,161 : INFO : topic diff=0.002690, rho=0.020481\n", + "2019-01-31 01:38:17,313 : INFO : PROGRESS: pass 0, at document #4770000/4922894\n", + "2019-01-31 01:38:18,671 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:18,937 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"mode\" + 0.006*\"measur\" + 0.006*\"southern\"\n", + "2019-01-31 01:38:18,938 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.017*\"ireland\" + 0.014*\"youth\" + 0.013*\"wale\"\n", + "2019-01-31 01:38:18,939 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.012*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:38:18,940 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:38:18,941 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" 
+ 0.012*\"squatter\" + 0.012*\"find\" + 0.010*\"landslid\"\n", + "2019-01-31 01:38:18,947 : INFO : topic diff=0.003038, rho=0.020477\n", + "2019-01-31 01:38:19,103 : INFO : PROGRESS: pass 0, at document #4772000/4922894\n", + "2019-01-31 01:38:20,476 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:20,746 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:38:20,747 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:38:20,748 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"mexico\" + 0.017*\"italian\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.010*\"itali\" + 0.010*\"carlo\"\n", + "2019-01-31 01:38:20,749 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"théori\" + 0.006*\"mode\" + 0.006*\"southern\" + 0.006*\"measur\"\n", + "2019-01-31 01:38:20,750 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.022*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:38:20,756 : INFO : topic diff=0.003262, rho=0.020472\n", + "2019-01-31 01:38:20,914 : INFO : PROGRESS: pass 0, at document #4774000/4922894\n", + "2019-01-31 01:38:22,300 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:22,567 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.030*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 
0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:38:22,568 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:38:22,569 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.027*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:38:22,570 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"class\" + 0.009*\"fleet\"\n", + "2019-01-31 01:38:22,572 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 01:38:22,578 : INFO : topic diff=0.003123, rho=0.020468\n", + "2019-01-31 01:38:22,737 : INFO : PROGRESS: pass 0, at document #4776000/4922894\n", + "2019-01-31 01:38:24,088 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:38:24,354 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.034*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.025*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:38:24,356 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.023*\"christian\" + 0.022*\"cathol\" + 0.021*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"poll\" + 0.010*\"historiographi\" + 0.010*\"relationship\" + 0.009*\"parish\"\n", + "2019-01-31 01:38:24,357 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.044*\"american\" + 
0.031*\"valour\" + 0.018*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.016*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:38:24,358 : INFO : topic #4 (0.020): 0.018*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"uruguayan\" + 0.007*\"elabor\" + 0.006*\"develop\" + 0.006*\"turn\" + 0.006*\"produc\"\n", + "2019-01-31 01:38:24,359 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 01:38:24,365 : INFO : topic diff=0.002873, rho=0.020464\n", + "2019-01-31 01:38:24,523 : INFO : PROGRESS: pass 0, at document #4778000/4922894\n", + "2019-01-31 01:38:25,893 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:26,159 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.071*\"juli\" + 0.070*\"august\" + 0.070*\"notion\" + 0.068*\"april\" + 0.067*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:38:26,160 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:38:26,161 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:38:26,162 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.044*\"american\" + 0.031*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:38:26,163 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 
0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"till\"\n", + "2019-01-31 01:38:26,169 : INFO : topic diff=0.003058, rho=0.020459\n", + "2019-01-31 01:38:28,797 : INFO : -12.003 per-word bound, 4105.5 perplexity estimate based on a held-out corpus of 2000 documents with 542807 words\n", + "2019-01-31 01:38:28,797 : INFO : PROGRESS: pass 0, at document #4780000/4922894\n", + "2019-01-31 01:38:30,144 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:30,412 : INFO : topic #1 (0.020): 0.055*\"china\" + 0.047*\"chilton\" + 0.027*\"kong\" + 0.026*\"hong\" + 0.021*\"korea\" + 0.020*\"korean\" + 0.017*\"sourc\" + 0.015*\"shirin\" + 0.015*\"leah\" + 0.014*\"kim\"\n", + "2019-01-31 01:38:30,413 : INFO : topic #9 (0.020): 0.073*\"bone\" + 0.044*\"american\" + 0.031*\"valour\" + 0.018*\"folei\" + 0.018*\"dutch\" + 0.018*\"player\" + 0.016*\"english\" + 0.016*\"polit\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:38:30,414 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.029*\"priest\" + 0.021*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.016*\"portugues\" + 0.013*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:38:30,415 : INFO : topic #43 (0.020): 0.065*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.014*\"liber\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:38:30,416 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.028*\"poison\" + 0.027*\"reprint\" + 0.024*\"personifi\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.017*\"turin\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:38:30,422 : INFO : topic diff=0.003218, rho=0.020455\n", + "2019-01-31 01:38:30,578 : INFO : PROGRESS: pass 0, at document #4782000/4922894\n", + "2019-01-31 
01:38:31,940 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:32,207 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:38:32,208 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"trace\"\n", + "2019-01-31 01:38:32,209 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.025*\"word\" + 0.020*\"new\" + 0.015*\"edit\" + 0.014*\"presid\" + 0.011*\"worldwid\" + 0.011*\"magazin\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:38:32,210 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.007*\"elabor\" + 0.006*\"develop\" + 0.006*\"turn\" + 0.006*\"produc\"\n", + "2019-01-31 01:38:32,211 : INFO : topic #34 (0.020): 0.066*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.027*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:38:32,217 : INFO : topic diff=0.003453, rho=0.020451\n", + "2019-01-31 01:38:32,374 : INFO : PROGRESS: pass 0, at document #4784000/4922894\n", + "2019-01-31 01:38:33,762 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:34,028 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"task\" + 0.010*\"gothic\"\n", + "2019-01-31 01:38:34,029 : INFO : topic #45 (0.020): 0.049*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 
0.021*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:38:34,030 : INFO : topic #46 (0.020): 0.017*\"swedish\" + 0.017*\"sweden\" + 0.016*\"stop\" + 0.015*\"norwai\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.013*\"damag\" + 0.011*\"treeless\" + 0.011*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:38:34,031 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.015*\"ret\" + 0.013*\"tornado\" + 0.012*\"driver\" + 0.012*\"fool\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.010*\"landslid\"\n", + "2019-01-31 01:38:34,032 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.024*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:38:34,038 : INFO : topic diff=0.002858, rho=0.020447\n", + "2019-01-31 01:38:34,196 : INFO : PROGRESS: pass 0, at document #4786000/4922894\n", + "2019-01-31 01:38:35,576 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:35,845 : INFO : topic #23 (0.020): 0.138*\"audit\" + 0.069*\"best\" + 0.035*\"yawn\" + 0.027*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.018*\"intern\" + 0.018*\"festiv\" + 0.013*\"prison\"\n", + "2019-01-31 01:38:35,846 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.015*\"wreath\" + 0.014*\"lazi\" + 0.013*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:38:35,847 : INFO : topic #48 (0.020): 0.080*\"march\" + 0.078*\"octob\" + 0.077*\"sens\" + 0.072*\"januari\" + 0.070*\"juli\" + 0.070*\"august\" + 0.070*\"notion\" + 0.068*\"april\" + 0.067*\"judici\" + 0.067*\"decatur\"\n", + "2019-01-31 01:38:35,848 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.029*\"priest\" + 0.021*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 
0.017*\"grammat\" + 0.017*\"quarterli\" + 0.016*\"portugues\" + 0.013*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:38:35,849 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:38:35,855 : INFO : topic diff=0.002986, rho=0.020442\n", + "2019-01-31 01:38:36,007 : INFO : PROGRESS: pass 0, at document #4788000/4922894\n", + "2019-01-31 01:38:37,350 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:38:37,617 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.011*\"silicon\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:38:37,618 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.046*\"canadian\" + 0.024*\"toronto\" + 0.023*\"hoar\" + 0.022*\"ontario\" + 0.016*\"quebec\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 01:38:37,619 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:38:37,620 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.022*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:38:37,621 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"english\" + 0.008*\"trade\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:38:37,626 : INFO : topic 
diff=0.003179, rho=0.020438\n", + "2019-01-31 01:38:37,785 : INFO : PROGRESS: pass 0, at document #4790000/4922894\n", + "2019-01-31 01:38:39,163 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:39,430 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.030*\"incumb\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.012*\"pakistan\" + 0.012*\"televis\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.010*\"affection\" + 0.010*\"alam\"\n", + "2019-01-31 01:38:39,431 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:38:39,432 : INFO : topic #17 (0.020): 0.080*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"historiographi\" + 0.010*\"poll\" + 0.009*\"parish\"\n", + "2019-01-31 01:38:39,433 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.009*\"battalion\" + 0.007*\"empath\" + 0.007*\"teufel\" + 0.007*\"armi\" + 0.006*\"govern\" + 0.006*\"militari\" + 0.006*\"pour\"\n", + "2019-01-31 01:38:39,434 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.023*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:38:39,439 : INFO : topic diff=0.002943, rho=0.020434\n", + "2019-01-31 01:38:39,595 : INFO : PROGRESS: pass 0, at document #4792000/4922894\n", + "2019-01-31 01:38:40,967 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:41,234 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.030*\"jpg\" + 0.030*\"museo\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + 
"2019-01-31 01:38:41,235 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.009*\"manag\" + 0.007*\"trace\"\n", + "2019-01-31 01:38:41,236 : INFO : topic #14 (0.020): 0.023*\"forc\" + 0.021*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:38:41,237 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:38:41,238 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.022*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:38:41,244 : INFO : topic diff=0.003370, rho=0.020429\n", + "2019-01-31 01:38:41,399 : INFO : PROGRESS: pass 0, at document #4794000/4922894\n", + "2019-01-31 01:38:42,752 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:43,018 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.017*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.009*\"polaris\" + 0.008*\"legal\" + 0.007*\"order\"\n", + "2019-01-31 01:38:43,020 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.010*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:38:43,021 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + 
"2019-01-31 01:38:43,022 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:38:43,023 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.034*\"tortur\" + 0.031*\"cotton\" + 0.023*\"multitud\" + 0.023*\"adulthood\" + 0.021*\"area\" + 0.020*\"cede\" + 0.019*\"commun\"\n", + "2019-01-31 01:38:43,029 : INFO : topic diff=0.002873, rho=0.020425\n", + "2019-01-31 01:38:43,184 : INFO : PROGRESS: pass 0, at document #4796000/4922894\n", + "2019-01-31 01:38:44,542 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:44,808 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:38:44,809 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:38:44,810 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.034*\"tortur\" + 0.031*\"cotton\" + 0.023*\"multitud\" + 0.023*\"adulthood\" + 0.021*\"area\" + 0.020*\"cede\" + 0.019*\"commun\"\n", + "2019-01-31 01:38:44,811 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:38:44,812 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"liber\" + 0.014*\"republ\" + 0.014*\"bypass\" + 
0.013*\"report\"\n", + "2019-01-31 01:38:44,818 : INFO : topic diff=0.003370, rho=0.020421\n", + "2019-01-31 01:38:44,982 : INFO : PROGRESS: pass 0, at document #4798000/4922894\n", + "2019-01-31 01:38:46,350 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:46,619 : INFO : topic #10 (0.020): 0.010*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:38:46,621 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.029*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:38:46,621 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.024*\"hoar\" + 0.022*\"ontario\" + 0.016*\"quebec\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.012*\"novotná\"\n", + "2019-01-31 01:38:46,622 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:38:46,624 : INFO : topic #46 (0.020): 0.018*\"swedish\" + 0.018*\"sweden\" + 0.016*\"stop\" + 0.016*\"norwai\" + 0.014*\"damag\" + 0.014*\"norwegian\" + 0.014*\"wind\" + 0.011*\"treeless\" + 0.010*\"huntsvil\" + 0.010*\"turkish\"\n", + "2019-01-31 01:38:46,629 : INFO : topic diff=0.003374, rho=0.020417\n", + "2019-01-31 01:38:49,362 : INFO : -11.734 per-word bound, 3406.2 perplexity estimate based on a held-out corpus of 2000 documents with 558364 words\n", + "2019-01-31 01:38:49,363 : INFO : PROGRESS: pass 0, at document #4800000/4922894\n", + "2019-01-31 01:38:50,748 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": 
"stream", + "text": [ + "2019-01-31 01:38:51,017 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:38:51,018 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.029*\"workplac\" + 0.026*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.019*\"alic\" + 0.018*\"taxpay\" + 0.018*\"atheist\"\n", + "2019-01-31 01:38:51,019 : INFO : topic #21 (0.020): 0.036*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.017*\"italian\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:38:51,020 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.020*\"place\" + 0.013*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"ruler\"\n", + "2019-01-31 01:38:51,021 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:38:51,027 : INFO : topic diff=0.003211, rho=0.020412\n", + "2019-01-31 01:38:51,182 : INFO : PROGRESS: pass 0, at document #4802000/4922894\n", + "2019-01-31 01:38:52,538 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:52,804 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 01:38:52,805 : INFO : topic #35 (0.020): 0.058*\"russia\" + 0.036*\"sovereignti\" + 0.034*\"rural\" + 0.028*\"poison\" + 0.027*\"reprint\" + 0.024*\"personifi\" + 0.019*\"moscow\" + 0.018*\"poland\" + 0.015*\"turin\" + 
0.014*\"unfortun\"\n", + "2019-01-31 01:38:52,806 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.073*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.022*\"japanes\" + 0.021*\"noll\" + 0.018*\"women\" + 0.018*\"intern\" + 0.017*\"festiv\" + 0.013*\"winner\"\n", + "2019-01-31 01:38:52,807 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:38:52,808 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:38:52,814 : INFO : topic diff=0.002899, rho=0.020408\n", + "2019-01-31 01:38:52,972 : INFO : PROGRESS: pass 0, at document #4804000/4922894\n", + "2019-01-31 01:38:54,359 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:54,626 : INFO : topic #0 (0.020): 0.060*\"statewid\" + 0.039*\"line\" + 0.032*\"rivièr\" + 0.029*\"raid\" + 0.026*\"rosenwald\" + 0.021*\"airmen\" + 0.018*\"serv\" + 0.017*\"traceabl\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:38:54,627 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.020*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.014*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:38:54,628 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.027*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.021*\"australian\" + 0.019*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:38:54,629 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 
0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:38:54,630 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.009*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:38:54,636 : INFO : topic diff=0.003219, rho=0.020404\n", + "2019-01-31 01:38:54,791 : INFO : PROGRESS: pass 0, at document #4806000/4922894\n", + "2019-01-31 01:38:56,153 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:38:56,419 : INFO : topic #45 (0.020): 0.049*\"arsen\" + 0.032*\"museo\" + 0.030*\"jpg\" + 0.027*\"fifteenth\" + 0.022*\"pain\" + 0.021*\"illicit\" + 0.017*\"artist\" + 0.017*\"exhaust\" + 0.016*\"gai\" + 0.014*\"colder\"\n", + "2019-01-31 01:38:56,420 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.025*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.016*\"chamber\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.012*\"open\"\n", + "2019-01-31 01:38:56,421 : INFO : topic #20 (0.020): 0.142*\"scholar\" + 0.038*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"task\" + 0.010*\"start\"\n", + "2019-01-31 01:38:56,422 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 01:38:56,423 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"includ\" + 0.012*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:38:56,429 : INFO : topic diff=0.002681, rho=0.020400\n", + "2019-01-31 01:38:56,586 : INFO : PROGRESS: pass 0, at document #4808000/4922894\n", + "2019-01-31 01:38:57,972 : INFO : merging changes from 2000 documents 
into a model of 4922894 documents\n", + "2019-01-31 01:38:58,238 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"uruguayan\"\n", + "2019-01-31 01:38:58,240 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.024*\"word\" + 0.020*\"new\" + 0.014*\"presid\" + 0.014*\"edit\" + 0.011*\"magazin\" + 0.011*\"worldwid\" + 0.011*\"nicola\" + 0.011*\"author\"\n", + "2019-01-31 01:38:58,241 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.045*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"wreath\" + 0.012*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:38:58,242 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:38:58,243 : INFO : topic #15 (0.020): 0.012*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:38:58,249 : INFO : topic diff=0.003120, rho=0.020395\n", + "2019-01-31 01:38:58,410 : INFO : PROGRESS: pass 0, at document #4810000/4922894\n", + "2019-01-31 01:39:00,009 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:00,277 : INFO : topic #9 (0.020): 0.075*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.019*\"folei\" + 0.017*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:39:00,278 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 
0.012*\"north\"\n", + "2019-01-31 01:39:00,279 : INFO : topic #42 (0.020): 0.047*\"german\" + 0.032*\"germani\" + 0.016*\"vol\" + 0.015*\"israel\" + 0.014*\"der\" + 0.014*\"jewish\" + 0.013*\"berlin\" + 0.009*\"european\" + 0.009*\"austria\" + 0.009*\"europ\"\n", + "2019-01-31 01:39:00,280 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.022*\"member\" + 0.018*\"start\" + 0.016*\"serv\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:39:00,281 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.045*\"canadian\" + 0.024*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.016*\"quebec\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 01:39:00,287 : INFO : topic diff=0.002673, rho=0.020391\n", + "2019-01-31 01:39:00,440 : INFO : PROGRESS: pass 0, at document #4812000/4922894\n", + "2019-01-31 01:39:01,787 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:02,053 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.020*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:39:02,054 : INFO : topic #11 (0.020): 0.022*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.007*\"georg\" + 0.007*\"rhyme\"\n", + "2019-01-31 01:39:02,055 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:39:02,057 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.017*\"place\" + 
0.015*\"damn\" + 0.014*\"orchestr\" + 0.014*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:39:02,058 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:39:02,063 : INFO : topic diff=0.003553, rho=0.020387\n", + "2019-01-31 01:39:02,222 : INFO : PROGRESS: pass 0, at document #4814000/4922894\n", + "2019-01-31 01:39:03,605 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:03,871 : INFO : topic #19 (0.020): 0.017*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:39:03,872 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.035*\"sovereignti\" + 0.033*\"rural\" + 0.028*\"poison\" + 0.027*\"reprint\" + 0.025*\"personifi\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.015*\"turin\" + 0.014*\"unfortun\"\n", + "2019-01-31 01:39:03,873 : INFO : topic #28 (0.020): 0.037*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.016*\"histor\" + 0.012*\"linear\" + 0.012*\"centuri\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:39:03,874 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:39:03,875 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:39:03,881 : INFO : topic diff=0.003579, rho=0.020383\n", + "2019-01-31 01:39:04,038 : INFO : PROGRESS: pass 0, at 
document #4816000/4922894\n", + "2019-01-31 01:39:05,404 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:05,671 : INFO : topic #3 (0.020): 0.033*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"minist\" + 0.023*\"govern\" + 0.022*\"member\" + 0.018*\"start\" + 0.016*\"serv\" + 0.016*\"gener\" + 0.014*\"council\"\n", + "2019-01-31 01:39:05,672 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.078*\"sens\" + 0.076*\"octob\" + 0.069*\"januari\" + 0.069*\"august\" + 0.068*\"juli\" + 0.068*\"notion\" + 0.067*\"april\" + 0.066*\"judici\" + 0.066*\"decatur\"\n", + "2019-01-31 01:39:05,673 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.045*\"chilton\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.020*\"korea\" + 0.020*\"korean\" + 0.019*\"shirin\" + 0.016*\"sourc\" + 0.015*\"leah\" + 0.013*\"kim\"\n", + "2019-01-31 01:39:05,674 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.007*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"end\" + 0.005*\"retrospect\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:39:05,675 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.022*\"spain\" + 0.018*\"del\" + 0.018*\"italian\" + 0.017*\"mexico\" + 0.014*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"francisco\" + 0.010*\"carlo\"\n", + "2019-01-31 01:39:05,681 : INFO : topic diff=0.002653, rho=0.020378\n", + "2019-01-31 01:39:05,839 : INFO : PROGRESS: pass 0, at document #4818000/4922894\n", + "2019-01-31 01:39:07,219 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:07,486 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:39:07,487 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"pathwai\" + 
0.007*\"hormon\" + 0.007*\"caus\" + 0.006*\"effect\" + 0.006*\"treat\" + 0.006*\"proper\"\n", + "2019-01-31 01:39:07,488 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.029*\"workplac\" + 0.025*\"alic\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"left\" + 0.019*\"event\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:39:07,489 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"grammat\" + 0.017*\"rotterdam\" + 0.017*\"portugues\" + 0.017*\"quarterli\" + 0.014*\"kingdom\" + 0.012*\"brazil\"\n", + "2019-01-31 01:39:07,490 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"pour\"\n", + "2019-01-31 01:39:07,496 : INFO : topic diff=0.003189, rho=0.020374\n", + "2019-01-31 01:39:10,159 : INFO : -11.683 per-word bound, 3287.4 perplexity estimate based on a held-out corpus of 2000 documents with 567625 words\n", + "2019-01-31 01:39:10,160 : INFO : PROGRESS: pass 0, at document #4820000/4922894\n", + "2019-01-31 01:39:11,525 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:11,792 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:39:11,793 : INFO : topic #33 (0.020): 0.060*\"french\" + 0.045*\"franc\" + 0.030*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"wreath\" + 0.012*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:39:11,794 : INFO : topic #48 (0.020): 0.079*\"march\" + 0.077*\"sens\" + 0.076*\"octob\" + 0.069*\"januari\" + 0.068*\"august\" + 0.068*\"notion\" + 0.068*\"juli\" + 0.067*\"april\" + 0.065*\"judici\" + 0.065*\"decatur\"\n", + "2019-01-31 
01:39:11,795 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"armi\" + 0.020*\"walter\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:39:11,796 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"daughter\"\n", + "2019-01-31 01:39:11,802 : INFO : topic diff=0.002941, rho=0.020370\n", + "2019-01-31 01:39:11,957 : INFO : PROGRESS: pass 0, at document #4822000/4922894\n", + "2019-01-31 01:39:13,293 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:13,560 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.011*\"market\" + 0.011*\"bank\" + 0.010*\"industri\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:39:13,561 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:39:13,562 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"caus\" + 0.007*\"pathwai\" + 0.007*\"hormon\" + 0.006*\"effect\" + 0.006*\"proper\" + 0.006*\"treat\"\n", + "2019-01-31 01:39:13,563 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.014*\"wreath\" + 0.012*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:39:13,564 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.021*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.011*\"north\"\n", + "2019-01-31 01:39:13,570 : INFO : topic diff=0.003419, 
rho=0.020366\n", + "2019-01-31 01:39:13,729 : INFO : PROGRESS: pass 0, at document #4824000/4922894\n", + "2019-01-31 01:39:15,111 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:15,377 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.013*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.007*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:39:15,378 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.046*\"canadian\" + 0.024*\"toronto\" + 0.024*\"hoar\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"quebec\" + 0.015*\"new\" + 0.014*\"novotná\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:39:15,379 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.017*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"includ\" + 0.012*\"lobe\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:15,380 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 0.010*\"muskoge\" + 0.010*\"alam\"\n", + "2019-01-31 01:39:15,381 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:39:15,387 : INFO : topic diff=0.003112, rho=0.020362\n", + "2019-01-31 01:39:15,549 : INFO : PROGRESS: pass 0, at document #4826000/4922894\n", + "2019-01-31 01:39:16,936 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:17,202 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.007*\"woman\" + 
0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:39:17,203 : INFO : topic #35 (0.020): 0.057*\"russia\" + 0.035*\"sovereignti\" + 0.032*\"rural\" + 0.028*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.020*\"moscow\" + 0.019*\"poland\" + 0.017*\"turin\" + 0.014*\"tyrant\"\n", + "2019-01-31 01:39:17,204 : INFO : topic #47 (0.020): 0.066*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.017*\"compos\" + 0.017*\"place\" + 0.016*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:39:17,205 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.014*\"tornado\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.012*\"squatter\" + 0.012*\"find\" + 0.009*\"théori\"\n", + "2019-01-31 01:39:17,207 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.013*\"oper\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:39:17,212 : INFO : topic diff=0.003252, rho=0.020357\n", + "2019-01-31 01:39:17,373 : INFO : PROGRESS: pass 0, at document #4828000/4922894\n", + "2019-01-31 01:39:18,779 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:19,046 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.010*\"coalit\" + 0.010*\"fleet\" + 0.010*\"class\"\n", + "2019-01-31 01:39:19,047 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.010*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:39:19,048 : INFO : topic #1 (0.020): 0.051*\"china\" + 0.044*\"chilton\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.020*\"korea\" + 0.020*\"korean\" + 0.018*\"shirin\" + 0.016*\"leah\" + 
0.016*\"sourc\" + 0.013*\"kim\"\n", + "2019-01-31 01:39:19,049 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"selma\"\n", + "2019-01-31 01:39:19,050 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"citi\"\n", + "2019-01-31 01:39:19,056 : INFO : topic diff=0.002922, rho=0.020353\n", + "2019-01-31 01:39:19,268 : INFO : PROGRESS: pass 0, at document #4830000/4922894\n", + "2019-01-31 01:39:20,622 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:20,889 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.012*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:20,890 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.008*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:20,891 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.007*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\" + 0.006*\"till\"\n", + "2019-01-31 01:39:20,892 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.031*\"museo\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.021*\"pain\" + 0.021*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.014*\"word\"\n", + "2019-01-31 01:39:20,893 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 
0.010*\"myspac\"\n", + "2019-01-31 01:39:20,899 : INFO : topic diff=0.003340, rho=0.020349\n", + "2019-01-31 01:39:21,055 : INFO : PROGRESS: pass 0, at document #4832000/4922894\n", + "2019-01-31 01:39:22,419 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:22,685 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.030*\"pari\" + 0.023*\"sail\" + 0.022*\"jean\" + 0.017*\"daphn\" + 0.014*\"wreath\" + 0.014*\"lazi\" + 0.012*\"loui\" + 0.012*\"piec\"\n", + "2019-01-31 01:39:22,686 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.016*\"polit\" + 0.016*\"english\" + 0.012*\"acrimoni\" + 0.012*\"simpler\"\n", + "2019-01-31 01:39:22,687 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"utopian\"\n", + "2019-01-31 01:39:22,688 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.020*\"theater\" + 0.019*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:39:22,689 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:39:22,695 : INFO : topic diff=0.003461, rho=0.020345\n", + "2019-01-31 01:39:22,851 : INFO : PROGRESS: pass 0, at document #4834000/4922894\n", + "2019-01-31 01:39:24,211 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:24,478 : INFO : topic #49 (0.020): 0.044*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.012*\"anglo\" + 0.012*\"televis\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 
0.011*\"muskoge\" + 0.010*\"alam\"\n", + "2019-01-31 01:39:24,479 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.026*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.012*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:24,480 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.055*\"parti\" + 0.024*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"report\"\n", + "2019-01-31 01:39:24,482 : INFO : topic #28 (0.020): 0.036*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.012*\"centuri\" + 0.011*\"silicon\" + 0.011*\"constitut\" + 0.011*\"depress\" + 0.010*\"pistol\"\n", + "2019-01-31 01:39:24,483 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"measur\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"servitud\" + 0.006*\"utopian\"\n", + "2019-01-31 01:39:24,489 : INFO : topic diff=0.002786, rho=0.020341\n", + "2019-01-31 01:39:24,640 : INFO : PROGRESS: pass 0, at document #4836000/4922894\n", + "2019-01-31 01:39:25,977 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:26,243 : INFO : topic #13 (0.020): 0.027*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.023*\"england\" + 0.021*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"wale\"\n", + "2019-01-31 01:39:26,244 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:39:26,245 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.028*\"workplac\" + 0.025*\"woman\" + 0.025*\"alic\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"left\" + 
0.019*\"event\" + 0.018*\"atheist\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:39:26,246 : INFO : topic #48 (0.020): 0.078*\"march\" + 0.076*\"sens\" + 0.076*\"octob\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.067*\"august\" + 0.067*\"juli\" + 0.066*\"april\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 01:39:26,247 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.046*\"canadian\" + 0.024*\"toronto\" + 0.024*\"hoar\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"quebec\" + 0.014*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 01:39:26,253 : INFO : topic diff=0.003121, rho=0.020336\n", + "2019-01-31 01:39:26,410 : INFO : PROGRESS: pass 0, at document #4838000/4922894\n", + "2019-01-31 01:39:27,790 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:28,056 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:39:28,057 : INFO : topic #0 (0.020): 0.060*\"statewid\" + 0.039*\"line\" + 0.031*\"rivièr\" + 0.029*\"raid\" + 0.026*\"rosenwald\" + 0.020*\"airmen\" + 0.018*\"traceabl\" + 0.018*\"serv\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:39:28,058 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.016*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.006*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:39:28,059 : INFO : topic #44 (0.020): 0.029*\"rooftop\" + 0.025*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.020*\"champion\" + 0.016*\"chamber\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:39:28,060 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 
0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:28,066 : INFO : topic diff=0.002750, rho=0.020332\n", + "2019-01-31 01:39:30,746 : INFO : -11.475 per-word bound, 2846.8 perplexity estimate based on a held-out corpus of 2000 documents with 566887 words\n", + "2019-01-31 01:39:30,747 : INFO : PROGRESS: pass 0, at document #4840000/4922894\n", + "2019-01-31 01:39:32,112 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:32,379 : INFO : topic #32 (0.020): 0.050*\"district\" + 0.047*\"popolo\" + 0.043*\"vigour\" + 0.034*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.022*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:39:32,380 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.006*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:39:32,381 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.010*\"acrimoni\" + 0.010*\"direct\" + 0.010*\"movi\"\n", + "2019-01-31 01:39:32,382 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.012*\"includ\" + 0.010*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:32,383 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.013*\"fool\" + 0.012*\"driver\" + 0.012*\"find\" + 0.012*\"squatter\" + 0.009*\"théori\"\n", + "2019-01-31 01:39:32,390 : INFO : topic diff=0.002968, rho=0.020328\n", + "2019-01-31 01:39:32,543 : INFO : PROGRESS: pass 0, at document #4842000/4922894\n", + "2019-01-31 01:39:33,883 : INFO : merging changes from 2000 
documents into a model of 4922894 documents\n", + "2019-01-31 01:39:34,149 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.031*\"perceptu\" + 0.021*\"theater\" + 0.019*\"compos\" + 0.017*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.011*\"word\"\n", + "2019-01-31 01:39:34,150 : INFO : topic #27 (0.020): 0.074*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.014*\"ret\" + 0.013*\"tornado\" + 0.013*\"fool\" + 0.012*\"find\" + 0.012*\"driver\" + 0.012*\"squatter\" + 0.009*\"théori\"\n", + "2019-01-31 01:39:34,152 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 01:39:34,153 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"disco\" + 0.007*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:39:34,154 : INFO : topic #23 (0.020): 0.134*\"audit\" + 0.072*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.020*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.017*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:39:34,160 : INFO : topic diff=0.002803, rho=0.020324\n", + "2019-01-31 01:39:34,314 : INFO : PROGRESS: pass 0, at document #4844000/4922894\n", + "2019-01-31 01:39:35,691 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:35,958 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.012*\"http\" + 0.011*\"governor\"\n", + "2019-01-31 01:39:35,959 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.019*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 
0.012*\"john\"\n", + "2019-01-31 01:39:35,960 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.024*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"liber\" + 0.014*\"bypass\" + 0.013*\"seaport\"\n", + "2019-01-31 01:39:35,961 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:39:35,962 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.010*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:39:35,968 : INFO : topic diff=0.002403, rho=0.020319\n", + "2019-01-31 01:39:36,128 : INFO : PROGRESS: pass 0, at document #4846000/4922894\n", + "2019-01-31 01:39:37,509 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:37,776 : INFO : topic #5 (0.020): 0.039*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:39:37,777 : INFO : topic #16 (0.020): 0.053*\"king\" + 0.030*\"priest\" + 0.021*\"duke\" + 0.018*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.016*\"portugues\" + 0.014*\"kingdom\" + 0.013*\"paisiello\"\n", + "2019-01-31 01:39:37,778 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:39:37,779 : INFO : topic #30 (0.020): 0.035*\"cleveland\" + 0.035*\"leagu\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 
0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:39:37,780 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.008*\"veget\" + 0.006*\"turn\" + 0.006*\"produc\" + 0.006*\"develop\"\n", + "2019-01-31 01:39:37,786 : INFO : topic diff=0.002993, rho=0.020315\n", + "2019-01-31 01:39:37,944 : INFO : PROGRESS: pass 0, at document #4848000/4922894\n", + "2019-01-31 01:39:39,323 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:39,590 : INFO : topic #39 (0.020): 0.060*\"canada\" + 0.047*\"canadian\" + 0.024*\"hoar\" + 0.024*\"toronto\" + 0.022*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"quebec\" + 0.014*\"new\" + 0.013*\"novotná\"\n", + "2019-01-31 01:39:39,591 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:39:39,592 : INFO : topic #2 (0.020): 0.049*\"isl\" + 0.038*\"shield\" + 0.018*\"narrat\" + 0.015*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"class\" + 0.010*\"coalit\" + 0.010*\"fleet\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:39:39,593 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"foam\" + 0.009*\"sourc\" + 0.009*\"palmer\"\n", + "2019-01-31 01:39:39,594 : INFO : topic #48 (0.020): 0.078*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.069*\"januari\" + 0.068*\"notion\" + 0.066*\"august\" + 0.066*\"april\" + 0.066*\"juli\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 01:39:39,600 : INFO : topic diff=0.002819, rho=0.020311\n", + "2019-01-31 01:39:39,758 : INFO : PROGRESS: pass 0, at document 
#4850000/4922894\n", + "2019-01-31 01:39:41,133 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:41,399 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.012*\"includ\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:41,400 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.012*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:39:41,401 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"disco\" + 0.008*\"have\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:39:41,402 : INFO : topic #48 (0.020): 0.078*\"march\" + 0.077*\"octob\" + 0.076*\"sens\" + 0.068*\"januari\" + 0.067*\"notion\" + 0.066*\"april\" + 0.066*\"august\" + 0.066*\"juli\" + 0.064*\"decatur\" + 0.063*\"judici\"\n", + "2019-01-31 01:39:41,403 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.029*\"priest\" + 0.020*\"duke\" + 0.019*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"portugues\" + 0.015*\"kingdom\" + 0.013*\"paisiello\"\n", + "2019-01-31 01:39:41,409 : INFO : topic diff=0.003103, rho=0.020307\n", + "2019-01-31 01:39:41,561 : INFO : PROGRESS: pass 0, at document #4852000/4922894\n", + "2019-01-31 01:39:42,894 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:43,160 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.022*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:39:43,161 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 
0.006*\"gener\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"utopian\" + 0.006*\"southern\"\n", + "2019-01-31 01:39:43,162 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.043*\"chilton\" + 0.026*\"hong\" + 0.025*\"kong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.017*\"shirin\" + 0.016*\"leah\" + 0.016*\"sourc\" + 0.013*\"kim\"\n", + "2019-01-31 01:39:43,163 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.012*\"wreath\" + 0.012*\"loui\" + 0.011*\"piec\"\n", + "2019-01-31 01:39:43,164 : INFO : topic #21 (0.020): 0.035*\"samford\" + 0.021*\"spain\" + 0.018*\"italian\" + 0.018*\"del\" + 0.017*\"mexico\" + 0.013*\"soviet\" + 0.012*\"santa\" + 0.011*\"juan\" + 0.011*\"carlo\" + 0.010*\"francisco\"\n", + "2019-01-31 01:39:43,170 : INFO : topic diff=0.003322, rho=0.020303\n", + "2019-01-31 01:39:43,326 : INFO : PROGRESS: pass 0, at document #4854000/4922894\n", + "2019-01-31 01:39:44,686 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:44,952 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.018*\"com\" + 0.013*\"militari\" + 0.013*\"oper\" + 0.013*\"unionist\" + 0.013*\"airbu\" + 0.011*\"diversifi\"\n", + "2019-01-31 01:39:44,953 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:44,954 : INFO : topic #25 (0.020): 0.032*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"land\" + 0.009*\"sourc\" + 0.009*\"foam\" + 0.009*\"palmer\"\n", + "2019-01-31 01:39:44,955 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.023*\"govern\" + 
0.023*\"minist\" + 0.022*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.016*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:39:44,956 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.030*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.016*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:39:44,962 : INFO : topic diff=0.002763, rho=0.020299\n", + "2019-01-31 01:39:45,118 : INFO : PROGRESS: pass 0, at document #4856000/4922894\n", + "2019-01-31 01:39:46,477 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:46,743 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.029*\"workplac\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.023*\"alic\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:39:46,744 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.071*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.020*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.017*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:39:46,746 : INFO : topic #42 (0.020): 0.048*\"german\" + 0.033*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"der\" + 0.014*\"israel\" + 0.013*\"jewish\" + 0.009*\"austria\" + 0.009*\"european\" + 0.009*\"europ\"\n", + "2019-01-31 01:39:46,747 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.031*\"museo\" + 0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.022*\"illicit\" + 0.021*\"pain\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:39:46,748 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:46,754 : INFO : topic diff=0.003339, rho=0.020294\n", + "2019-01-31 01:39:46,910 : INFO : PROGRESS: pass 0, at document 
#4858000/4922894\n", + "2019-01-31 01:39:48,361 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:48,629 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:48,631 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.011*\"anim\" + 0.010*\"man\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:39:48,632 : INFO : topic #20 (0.020): 0.140*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:39:48,633 : INFO : topic #9 (0.020): 0.077*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.018*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.012*\"acrimoni\"\n", + "2019-01-31 01:39:48,634 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.006*\"poet\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"utopian\"\n", + "2019-01-31 01:39:48,640 : INFO : topic diff=0.002960, rho=0.020290\n", + "2019-01-31 01:39:51,335 : INFO : -11.403 per-word bound, 2708.1 perplexity estimate based on a held-out corpus of 2000 documents with 577801 words\n", + "2019-01-31 01:39:51,335 : INFO : PROGRESS: pass 0, at document #4860000/4922894\n", + "2019-01-31 01:39:52,705 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:52,972 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.017*\"daphn\" + 0.014*\"lazi\" + 0.013*\"wreath\" + 
0.012*\"loui\" + 0.011*\"piec\"\n", + "2019-01-31 01:39:52,973 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.007*\"poet\" + 0.006*\"gener\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"utopian\"\n", + "2019-01-31 01:39:52,974 : INFO : topic #16 (0.020): 0.054*\"king\" + 0.029*\"priest\" + 0.020*\"duke\" + 0.018*\"idiosyncrat\" + 0.018*\"rotterdam\" + 0.017*\"grammat\" + 0.017*\"quarterli\" + 0.016*\"portugues\" + 0.014*\"kingdom\" + 0.013*\"paisiello\"\n", + "2019-01-31 01:39:52,975 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.018*\"factor\" + 0.012*\"plaisir\" + 0.011*\"genu\" + 0.010*\"western\" + 0.009*\"biom\" + 0.008*\"median\" + 0.006*\"trap\" + 0.006*\"incom\" + 0.006*\"florida\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:39:52,976 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.019*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"lobe\" + 0.012*\"includ\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:52,982 : INFO : topic diff=0.003327, rho=0.020286\n", + "2019-01-31 01:39:53,136 : INFO : PROGRESS: pass 0, at document #4862000/4922894\n", + "2019-01-31 01:39:54,484 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:54,751 : INFO : topic #33 (0.020): 0.059*\"french\" + 0.044*\"franc\" + 0.031*\"pari\" + 0.023*\"jean\" + 0.022*\"sail\" + 0.018*\"daphn\" + 0.014*\"lazi\" + 0.013*\"wreath\" + 0.012*\"loui\" + 0.011*\"piec\"\n", + "2019-01-31 01:39:54,752 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.029*\"incumb\" + 0.014*\"islam\" + 0.013*\"pakistan\" + 0.013*\"anglo\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 0.011*\"muskoge\" + 0.010*\"alam\"\n", + "2019-01-31 01:39:54,753 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 
0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:54,754 : INFO : topic #44 (0.020): 0.030*\"rooftop\" + 0.026*\"final\" + 0.023*\"wife\" + 0.021*\"tourist\" + 0.019*\"champion\" + 0.015*\"chamber\" + 0.015*\"martin\" + 0.014*\"taxpay\" + 0.014*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:39:54,755 : INFO : topic #39 (0.020): 0.059*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.014*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 01:39:54,761 : INFO : topic diff=0.002938, rho=0.020282\n", + "2019-01-31 01:39:54,968 : INFO : PROGRESS: pass 0, at document #4864000/4922894\n", + "2019-01-31 01:39:56,299 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:56,567 : INFO : topic #12 (0.020): 0.008*\"number\" + 0.007*\"frontal\" + 0.006*\"gener\" + 0.006*\"poet\" + 0.006*\"servitud\" + 0.006*\"exampl\" + 0.006*\"théori\" + 0.006*\"measur\" + 0.006*\"southern\" + 0.006*\"utopian\"\n", + "2019-01-31 01:39:56,568 : INFO : topic #9 (0.020): 0.076*\"bone\" + 0.042*\"american\" + 0.031*\"valour\" + 0.019*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.012*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:39:56,569 : INFO : topic #13 (0.020): 0.026*\"london\" + 0.026*\"australia\" + 0.025*\"new\" + 0.025*\"sourc\" + 0.024*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"wale\" + 0.014*\"weekli\"\n", + "2019-01-31 01:39:56,570 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.014*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:39:56,571 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"cathol\" + 
0.024*\"christian\" + 0.022*\"bishop\" + 0.016*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:39:56,577 : INFO : topic diff=0.003424, rho=0.020278\n", + "2019-01-31 01:39:56,735 : INFO : PROGRESS: pass 0, at document #4866000/4922894\n", + "2019-01-31 01:39:58,277 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:39:58,544 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"retrospect\" + 0.005*\"like\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:39:58,545 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.010*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"diggin\" + 0.008*\"develop\" + 0.008*\"softwar\" + 0.008*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:39:58,546 : INFO : topic #46 (0.020): 0.017*\"sweden\" + 0.017*\"swedish\" + 0.017*\"stop\" + 0.015*\"norwai\" + 0.014*\"treeless\" + 0.014*\"wind\" + 0.013*\"damag\" + 0.013*\"norwegian\" + 0.010*\"farid\" + 0.010*\"huntsvil\"\n", + "2019-01-31 01:39:58,547 : INFO : topic #35 (0.020): 0.056*\"russia\" + 0.037*\"sovereignti\" + 0.032*\"rural\" + 0.029*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.022*\"poland\" + 0.018*\"moscow\" + 0.015*\"turin\" + 0.015*\"unfortun\"\n", + "2019-01-31 01:39:58,548 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"open\" + 0.012*\"center\" + 0.012*\"includ\" + 0.012*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:39:58,554 : INFO : topic diff=0.003362, rho=0.020274\n", + "2019-01-31 01:39:58,716 : INFO : PROGRESS: pass 0, at document #4868000/4922894\n", + "2019-01-31 01:40:00,120 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:00,386 : INFO : topic #39 (0.020): 
0.058*\"canada\" + 0.046*\"canadian\" + 0.024*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.016*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.015*\"quebec\" + 0.013*\"novotná\"\n", + "2019-01-31 01:40:00,387 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.025*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:40:00,388 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:00,389 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:40:00,390 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.070*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.020*\"noll\" + 0.018*\"women\" + 0.017*\"intern\" + 0.017*\"festiv\" + 0.014*\"prison\"\n", + "2019-01-31 01:40:00,396 : INFO : topic diff=0.003458, rho=0.020269\n", + "2019-01-31 01:40:00,550 : INFO : PROGRESS: pass 0, at document #4870000/4922894\n", + "2019-01-31 01:40:01,891 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:02,157 : INFO : topic #28 (0.020): 0.037*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.012*\"centuri\" + 0.012*\"silicon\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:40:02,158 : INFO : topic #26 (0.020): 0.029*\"champion\" + 0.028*\"workplac\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.024*\"alic\" + 0.023*\"men\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:40:02,160 : INFO : topic #18 (0.020): 
0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:02,161 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.025*\"cathol\" + 0.024*\"christian\" + 0.022*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.009*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"parish\"\n", + "2019-01-31 01:40:02,162 : INFO : topic #40 (0.020): 0.086*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"requir\" + 0.020*\"collector\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:40:02,168 : INFO : topic diff=0.003171, rho=0.020265\n", + "2019-01-31 01:40:02,323 : INFO : PROGRESS: pass 0, at document #4872000/4922894\n", + "2019-01-31 01:40:03,693 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:03,959 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:40:03,960 : INFO : topic #28 (0.020): 0.037*\"build\" + 0.030*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.012*\"centuri\" + 0.012*\"silicon\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:40:03,961 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.029*\"incumb\" + 0.013*\"islam\" + 0.013*\"pakistan\" + 0.013*\"anglo\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.011*\"khalsa\" + 0.010*\"muskoge\" + 0.010*\"alam\"\n", + "2019-01-31 01:40:03,962 : INFO : topic #29 (0.020): 0.031*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"produc\" + 0.012*\"market\" + 0.011*\"industri\" + 0.010*\"bank\" + 0.009*\"yawn\" + 0.008*\"manag\" + 0.007*\"oper\"\n", + "2019-01-31 01:40:03,963 : INFO : topic #2 
(0.020): 0.049*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"class\" + 0.010*\"coalit\" + 0.010*\"fleet\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:40:03,969 : INFO : topic diff=0.002540, rho=0.020261\n", + "2019-01-31 01:40:04,123 : INFO : PROGRESS: pass 0, at document #4874000/4922894\n", + "2019-01-31 01:40:05,481 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:05,747 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.006*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:40:05,749 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.032*\"place\" + 0.027*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.012*\"schmitz\"\n", + "2019-01-31 01:40:05,750 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:40:05,751 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"nation\" + 0.024*\"offic\" + 0.024*\"govern\" + 0.023*\"minist\" + 0.023*\"member\" + 0.018*\"start\" + 0.017*\"serv\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:40:05,752 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:40:05,758 : INFO : topic diff=0.002992, rho=0.020257\n", + "2019-01-31 01:40:05,914 : INFO : PROGRESS: pass 0, at document #4876000/4922894\n", + "2019-01-31 01:40:07,290 : INFO : merging changes from 2000 documents 
into a model of 4922894 documents\n", + "2019-01-31 01:40:07,557 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.039*\"line\" + 0.031*\"rivièr\" + 0.029*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"airmen\" + 0.017*\"serv\" + 0.017*\"traceabl\" + 0.013*\"oper\" + 0.012*\"briarwood\"\n", + "2019-01-31 01:40:07,558 : INFO : topic #22 (0.020): 0.034*\"spars\" + 0.017*\"factor\" + 0.012*\"plaisir\" + 0.010*\"genu\" + 0.010*\"western\" + 0.008*\"biom\" + 0.008*\"median\" + 0.007*\"trap\" + 0.006*\"incom\" + 0.006*\"florida\"\n", + "2019-01-31 01:40:07,559 : INFO : topic #39 (0.020): 0.058*\"canada\" + 0.046*\"canadian\" + 0.025*\"toronto\" + 0.024*\"hoar\" + 0.021*\"ontario\" + 0.015*\"hydrogen\" + 0.015*\"misericordia\" + 0.015*\"new\" + 0.014*\"quebec\" + 0.014*\"novotná\"\n", + "2019-01-31 01:40:07,560 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:40:07,561 : INFO : topic #41 (0.020): 0.043*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.019*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:40:07,567 : INFO : topic diff=0.003077, rho=0.020253\n", + "2019-01-31 01:40:07,727 : INFO : PROGRESS: pass 0, at document #4878000/4922894\n", + "2019-01-31 01:40:09,052 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:09,318 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.031*\"perceptu\" + 0.020*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:40:09,319 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.019*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" 
+ 0.012*\"john\"\n", + "2019-01-31 01:40:09,320 : INFO : topic #13 (0.020): 0.027*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"wale\" + 0.014*\"weekli\"\n", + "2019-01-31 01:40:09,321 : INFO : topic #26 (0.020): 0.028*\"champion\" + 0.028*\"workplac\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.023*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:40:09,322 : INFO : topic #20 (0.020): 0.141*\"scholar\" + 0.039*\"struggl\" + 0.032*\"high\" + 0.029*\"educ\" + 0.023*\"collector\" + 0.017*\"yawn\" + 0.012*\"prognosi\" + 0.011*\"district\" + 0.010*\"gothic\" + 0.010*\"task\"\n", + "2019-01-31 01:40:09,328 : INFO : topic diff=0.003009, rho=0.020249\n", + "2019-01-31 01:40:12,015 : INFO : -11.801 per-word bound, 3568.7 perplexity estimate based on a held-out corpus of 2000 documents with 551274 words\n", + "2019-01-31 01:40:12,016 : INFO : PROGRESS: pass 0, at document #4880000/4922894\n", + "2019-01-31 01:40:13,393 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:13,660 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:13,661 : INFO : topic #48 (0.020): 0.077*\"octob\" + 0.077*\"march\" + 0.075*\"sens\" + 0.067*\"juli\" + 0.067*\"januari\" + 0.067*\"notion\" + 0.066*\"august\" + 0.066*\"april\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 01:40:13,662 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.015*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"myspac\"\n", + "2019-01-31 01:40:13,663 : INFO : topic #13 (0.020): 0.027*\"australia\" + 
0.026*\"london\" + 0.025*\"sourc\" + 0.025*\"new\" + 0.024*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"wale\" + 0.014*\"weekli\"\n", + "2019-01-31 01:40:13,664 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.013*\"airbu\" + 0.011*\"refut\"\n", + "2019-01-31 01:40:13,670 : INFO : topic diff=0.003230, rho=0.020244\n", + "2019-01-31 01:40:13,827 : INFO : PROGRESS: pass 0, at document #4882000/4922894\n", + "2019-01-31 01:40:15,209 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:15,476 : INFO : topic #6 (0.020): 0.069*\"fewer\" + 0.023*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"proclaim\" + 0.012*\"rodríguez\" + 0.011*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:40:15,477 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.009*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"effect\" + 0.006*\"treat\"\n", + "2019-01-31 01:40:15,478 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.008*\"elabor\" + 0.008*\"veget\" + 0.006*\"develop\" + 0.006*\"produc\" + 0.006*\"turn\"\n", + "2019-01-31 01:40:15,479 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.047*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:40:15,480 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.017*\"taxpay\"\n", + "2019-01-31 01:40:15,486 : INFO : topic diff=0.003092, rho=0.020240\n", + 
"2019-01-31 01:40:15,639 : INFO : PROGRESS: pass 0, at document #4884000/4922894\n", + "2019-01-31 01:40:16,989 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:17,255 : INFO : topic #31 (0.020): 0.050*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.010*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:40:17,256 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.047*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.032*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:40:17,257 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"foam\" + 0.008*\"palmer\"\n", + "2019-01-31 01:40:17,258 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.042*\"american\" + 0.030*\"valour\" + 0.019*\"dutch\" + 0.017*\"folei\" + 0.017*\"player\" + 0.017*\"english\" + 0.017*\"polit\" + 0.011*\"simpler\" + 0.011*\"acrimoni\"\n", + "2019-01-31 01:40:17,259 : INFO : topic #30 (0.020): 0.035*\"leagu\" + 0.035*\"cleveland\" + 0.032*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:40:17,265 : INFO : topic diff=0.002712, rho=0.020236\n", + "2019-01-31 01:40:17,421 : INFO : PROGRESS: pass 0, at document #4886000/4922894\n", + "2019-01-31 01:40:18,792 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:19,059 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.071*\"best\" + 0.035*\"yawn\" + 0.028*\"jacksonvil\" + 0.023*\"japanes\" + 0.020*\"noll\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.018*\"women\" + 
0.013*\"prison\"\n", + "2019-01-31 01:40:19,060 : INFO : topic #8 (0.020): 0.026*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" + 0.008*\"order\"\n", + "2019-01-31 01:40:19,061 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.043*\"chilton\" + 0.025*\"hong\" + 0.025*\"kong\" + 0.021*\"korea\" + 0.018*\"korean\" + 0.017*\"leah\" + 0.016*\"shirin\" + 0.016*\"sourc\" + 0.014*\"kim\"\n", + "2019-01-31 01:40:19,062 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.022*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 01:40:19,063 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.025*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:40:19,069 : INFO : topic diff=0.002997, rho=0.020232\n", + "2019-01-31 01:40:19,241 : INFO : PROGRESS: pass 0, at document #4888000/4922894\n", + "2019-01-31 01:40:20,654 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:20,921 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"servitud\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 01:40:20,922 : INFO : topic #2 (0.020): 0.050*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.012*\"blur\" + 0.011*\"nativist\" + 0.011*\"class\" + 0.010*\"coalit\" + 0.010*\"fleet\"\n", + "2019-01-31 01:40:20,923 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.034*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.014*\"jewish\" + 0.013*\"der\" + 0.013*\"israel\" + 0.010*\"austria\" + 0.010*\"europ\" + 0.009*\"european\"\n", + 
"2019-01-31 01:40:20,924 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.070*\"best\" + 0.035*\"yawn\" + 0.029*\"jacksonvil\" + 0.023*\"japanes\" + 0.020*\"noll\" + 0.018*\"festiv\" + 0.018*\"intern\" + 0.018*\"women\" + 0.013*\"prison\"\n", + "2019-01-31 01:40:20,925 : INFO : topic #11 (0.020): 0.022*\"john\" + 0.011*\"david\" + 0.011*\"will\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"paul\" + 0.008*\"slur\" + 0.008*\"rhyme\" + 0.008*\"georg\"\n", + "2019-01-31 01:40:20,931 : INFO : topic diff=0.003682, rho=0.020228\n", + "2019-01-31 01:40:21,092 : INFO : PROGRESS: pass 0, at document #4890000/4922894\n", + "2019-01-31 01:40:22,478 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:22,745 : INFO : topic #45 (0.020): 0.047*\"arsen\" + 0.031*\"museo\" + 0.031*\"jpg\" + 0.029*\"fifteenth\" + 0.021*\"pain\" + 0.021*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.015*\"colder\"\n", + "2019-01-31 01:40:22,746 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.031*\"perceptu\" + 0.021*\"theater\" + 0.018*\"compos\" + 0.018*\"place\" + 0.015*\"damn\" + 0.014*\"orchestr\" + 0.013*\"olympo\" + 0.012*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:40:22,747 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.020*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"airbu\" + 0.010*\"refut\"\n", + "2019-01-31 01:40:22,748 : INFO : topic #34 (0.020): 0.068*\"start\" + 0.032*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:40:22,749 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.035*\"tortur\" + 0.033*\"cotton\" + 0.023*\"multitud\" + 0.022*\"adulthood\" + 0.022*\"area\" + 0.019*\"cede\" + 0.018*\"commun\"\n", + "2019-01-31 
01:40:22,755 : INFO : topic diff=0.003061, rho=0.020224\n", + "2019-01-31 01:40:22,911 : INFO : PROGRESS: pass 0, at document #4892000/4922894\n", + "2019-01-31 01:40:24,273 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:24,539 : INFO : topic #10 (0.020): 0.011*\"cdd\" + 0.008*\"media\" + 0.008*\"have\" + 0.008*\"disco\" + 0.007*\"hormon\" + 0.007*\"pathwai\" + 0.007*\"caus\" + 0.006*\"proper\" + 0.006*\"treat\" + 0.006*\"effect\"\n", + "2019-01-31 01:40:24,540 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.006*\"turn\" + 0.006*\"develop\" + 0.006*\"produc\"\n", + "2019-01-31 01:40:24,541 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"armi\" + 0.007*\"empath\" + 0.007*\"till\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:40:24,542 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"fool\" + 0.013*\"tornado\" + 0.013*\"ret\" + 0.012*\"find\" + 0.012*\"driver\" + 0.010*\"squatter\" + 0.009*\"théori\"\n", + "2019-01-31 01:40:24,543 : INFO : topic #23 (0.020): 0.135*\"audit\" + 0.070*\"best\" + 0.035*\"yawn\" + 0.030*\"jacksonvil\" + 0.024*\"japanes\" + 0.020*\"noll\" + 0.018*\"festiv\" + 0.018*\"women\" + 0.018*\"intern\" + 0.013*\"prison\"\n", + "2019-01-31 01:40:24,549 : INFO : topic diff=0.003183, rho=0.020220\n", + "2019-01-31 01:40:24,763 : INFO : PROGRESS: pass 0, at document #4894000/4922894\n", + "2019-01-31 01:40:26,160 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:26,428 : INFO : topic #35 (0.020): 0.055*\"russia\" + 0.039*\"sovereignti\" + 0.032*\"rural\" + 0.028*\"poison\" + 0.026*\"reprint\" + 0.024*\"personifi\" + 0.021*\"poland\" + 0.019*\"moscow\" + 0.018*\"turin\" + 
0.015*\"unfortun\"\n", + "2019-01-31 01:40:26,429 : INFO : topic #26 (0.020): 0.028*\"champion\" + 0.028*\"workplac\" + 0.025*\"woman\" + 0.024*\"olymp\" + 0.023*\"men\" + 0.022*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:40:26,430 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.021*\"institut\" + 0.021*\"collector\" + 0.021*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:40:26,431 : INFO : topic #48 (0.020): 0.078*\"octob\" + 0.077*\"march\" + 0.075*\"sens\" + 0.068*\"notion\" + 0.067*\"januari\" + 0.067*\"juli\" + 0.066*\"august\" + 0.066*\"april\" + 0.065*\"decatur\" + 0.064*\"judici\"\n", + "2019-01-31 01:40:26,432 : INFO : topic #31 (0.020): 0.051*\"fusiform\" + 0.027*\"scientist\" + 0.025*\"taxpay\" + 0.023*\"player\" + 0.019*\"place\" + 0.014*\"clot\" + 0.013*\"leagu\" + 0.011*\"folei\" + 0.010*\"yawn\" + 0.009*\"reconstruct\"\n", + "2019-01-31 01:40:26,438 : INFO : topic diff=0.003392, rho=0.020215\n", + "2019-01-31 01:40:26,594 : INFO : PROGRESS: pass 0, at document #4896000/4922894\n", + "2019-01-31 01:40:27,951 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:28,217 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.016*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.009*\"palmer\" + 0.009*\"foam\"\n", + "2019-01-31 01:40:28,218 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.018*\"grammat\" + 0.016*\"kingdom\" + 0.014*\"portugues\" + 0.012*\"crittenden\"\n", + "2019-01-31 01:40:28,219 : INFO : topic #8 (0.020): 0.027*\"law\" + 0.023*\"cortic\" + 0.018*\"start\" + 0.016*\"act\" + 0.012*\"ricardo\" + 0.012*\"case\" + 0.010*\"replac\" + 0.010*\"polaris\" + 0.008*\"legal\" 
+ 0.008*\"judaism\"\n", + "2019-01-31 01:40:28,220 : INFO : topic #36 (0.020): 0.011*\"network\" + 0.011*\"prognosi\" + 0.010*\"pop\" + 0.009*\"cytokin\" + 0.008*\"develop\" + 0.008*\"diggin\" + 0.008*\"softwar\" + 0.007*\"uruguayan\" + 0.007*\"user\" + 0.007*\"includ\"\n", + "2019-01-31 01:40:28,221 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"john\"\n", + "2019-01-31 01:40:28,227 : INFO : topic diff=0.002795, rho=0.020211\n", + "2019-01-31 01:40:28,385 : INFO : PROGRESS: pass 0, at document #4898000/4922894\n", + "2019-01-31 01:40:29,768 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:40:30,034 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"mode\" + 0.008*\"uruguayan\" + 0.006*\"develop\" + 0.006*\"turn\" + 0.006*\"produc\"\n", + "2019-01-31 01:40:30,035 : INFO : topic #26 (0.020): 0.028*\"champion\" + 0.028*\"workplac\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:40:30,036 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.010*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:40:30,037 : INFO : topic #28 (0.020): 0.037*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"silicon\" + 0.011*\"centuri\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:40:30,038 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 
0.018*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"kingdom\" + 0.014*\"portugues\" + 0.012*\"crittenden\"\n", + "2019-01-31 01:40:30,044 : INFO : topic diff=0.003133, rho=0.020207\n", + "2019-01-31 01:40:32,681 : INFO : -11.399 per-word bound, 2701.2 perplexity estimate based on a held-out corpus of 2000 documents with 546394 words\n", + "2019-01-31 01:40:32,681 : INFO : PROGRESS: pass 0, at document #4900000/4922894\n", + "2019-01-31 01:40:34,032 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:34,299 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.023*\"govern\" + 0.023*\"minist\" + 0.022*\"member\" + 0.019*\"serv\" + 0.018*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:40:34,300 : INFO : topic #26 (0.020): 0.028*\"workplac\" + 0.028*\"champion\" + 0.025*\"woman\" + 0.025*\"olymp\" + 0.023*\"men\" + 0.021*\"alic\" + 0.021*\"medal\" + 0.020*\"event\" + 0.018*\"atheist\" + 0.018*\"taxpay\"\n", + "2019-01-31 01:40:34,301 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"mode\"\n", + "2019-01-31 01:40:34,302 : INFO : topic #2 (0.020): 0.048*\"isl\" + 0.039*\"shield\" + 0.018*\"narrat\" + 0.014*\"scot\" + 0.012*\"pope\" + 0.011*\"blur\" + 0.011*\"nativist\" + 0.010*\"class\" + 0.010*\"coalit\" + 0.010*\"fleet\"\n", + "2019-01-31 01:40:34,303 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"airbu\" + 0.010*\"diversifi\"\n", + "2019-01-31 01:40:34,309 : INFO : topic diff=0.003008, rho=0.020203\n", + "2019-01-31 01:40:34,464 : INFO : PROGRESS: pass 0, at document #4902000/4922894\n", + "2019-01-31 01:40:35,845 : INFO : merging changes from 2000 documents into a model of 
4922894 documents\n", + "2019-01-31 01:40:36,111 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:40:36,112 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"fusiform\" + 0.007*\"appear\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:40:36,113 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"workplac\"\n", + "2019-01-31 01:40:36,114 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 0.024*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:40:36,115 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.010*\"direct\" + 0.010*\"acrimoni\" + 0.010*\"movi\"\n", + "2019-01-31 01:40:36,121 : INFO : topic diff=0.002406, rho=0.020199\n", + "2019-01-31 01:40:36,277 : INFO : PROGRESS: pass 0, at document #4904000/4922894\n", + "2019-01-31 01:40:37,630 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:37,896 : INFO : topic #28 (0.020): 0.037*\"build\" + 0.031*\"hous\" + 0.019*\"buford\" + 0.015*\"histor\" + 0.012*\"linear\" + 0.011*\"centuri\" + 0.011*\"silicon\" + 0.011*\"depress\" + 0.011*\"constitut\" + 0.010*\"pistol\"\n", + "2019-01-31 01:40:37,898 : INFO : topic #14 (0.020): 0.024*\"forc\" + 0.022*\"aggress\" + 0.021*\"walter\" + 0.020*\"armi\" + 0.017*\"com\" + 0.013*\"militari\" + 0.013*\"unionist\" + 0.013*\"oper\" + 0.012*\"airbu\" + 
0.010*\"diversifi\"\n", + "2019-01-31 01:40:37,899 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:37,900 : INFO : topic #19 (0.020): 0.016*\"languag\" + 0.015*\"centuri\" + 0.010*\"woodcut\" + 0.009*\"form\" + 0.009*\"origin\" + 0.009*\"mean\" + 0.008*\"trade\" + 0.008*\"english\" + 0.007*\"known\" + 0.007*\"ancestor\"\n", + "2019-01-31 01:40:37,901 : INFO : topic #9 (0.020): 0.074*\"bone\" + 0.043*\"american\" + 0.030*\"valour\" + 0.020*\"dutch\" + 0.018*\"folei\" + 0.017*\"player\" + 0.017*\"polit\" + 0.016*\"english\" + 0.011*\"acrimoni\" + 0.011*\"simpler\"\n", + "2019-01-31 01:40:37,907 : INFO : topic diff=0.002723, rho=0.020195\n", + "2019-01-31 01:40:38,065 : INFO : PROGRESS: pass 0, at document #4906000/4922894\n", + "2019-01-31 01:40:39,438 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:39,704 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:39,705 : INFO : topic #7 (0.020): 0.021*\"snatch\" + 0.020*\"di\" + 0.018*\"factor\" + 0.016*\"yawn\" + 0.016*\"margin\" + 0.014*\"bone\" + 0.013*\"life\" + 0.012*\"faster\" + 0.012*\"will\" + 0.012*\"deal\"\n", + "2019-01-31 01:40:39,706 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"affection\" + 0.011*\"khalsa\" + 0.011*\"muskoge\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:40:39,707 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.034*\"germani\" + 0.016*\"vol\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"austria\" + 0.009*\"europ\" + 0.009*\"european\"\n", + 
"2019-01-31 01:40:39,708 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.030*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"kingdom\" + 0.014*\"portugues\" + 0.011*\"paisiello\"\n", + "2019-01-31 01:40:39,714 : INFO : topic diff=0.002928, rho=0.020191\n", + "2019-01-31 01:40:39,870 : INFO : PROGRESS: pass 0, at document #4908000/4922894\n", + "2019-01-31 01:40:41,231 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:41,497 : INFO : topic #43 (0.020): 0.067*\"elect\" + 0.053*\"parti\" + 0.025*\"voluntari\" + 0.022*\"democrat\" + 0.019*\"member\" + 0.017*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"liber\" + 0.013*\"report\"\n", + "2019-01-31 01:40:41,498 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:40:41,499 : INFO : topic #34 (0.020): 0.067*\"start\" + 0.033*\"new\" + 0.031*\"american\" + 0.030*\"unionist\" + 0.026*\"cotton\" + 0.020*\"year\" + 0.015*\"california\" + 0.013*\"warrior\" + 0.012*\"terri\" + 0.012*\"north\"\n", + "2019-01-31 01:40:41,500 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.008*\"battalion\" + 0.008*\"teufel\" + 0.007*\"till\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:40:41,501 : INFO : topic #16 (0.020): 0.056*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.018*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"kingdom\" + 0.014*\"portugues\" + 0.011*\"crittenden\"\n", + "2019-01-31 01:40:41,507 : INFO : topic diff=0.003263, rho=0.020187\n", + "2019-01-31 01:40:41,660 : INFO : PROGRESS: pass 0, at document #4910000/4922894\n", + "2019-01-31 01:40:42,995 : INFO : merging changes from 
2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:40:43,261 : INFO : topic #4 (0.020): 0.019*\"enfranchis\" + 0.015*\"depress\" + 0.013*\"pour\" + 0.008*\"mode\" + 0.008*\"veget\" + 0.008*\"elabor\" + 0.008*\"uruguayan\" + 0.006*\"develop\" + 0.006*\"turn\" + 0.006*\"produc\"\n", + "2019-01-31 01:40:43,262 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"word\" + 0.008*\"peopl\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:40:43,263 : INFO : topic #42 (0.020): 0.049*\"german\" + 0.034*\"germani\" + 0.015*\"vol\" + 0.014*\"berlin\" + 0.013*\"israel\" + 0.013*\"der\" + 0.013*\"jewish\" + 0.010*\"austria\" + 0.009*\"europ\" + 0.009*\"european\"\n", + "2019-01-31 01:40:43,264 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.010*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:40:43,265 : INFO : topic #12 (0.020): 0.009*\"number\" + 0.007*\"frontal\" + 0.007*\"gener\" + 0.006*\"poet\" + 0.006*\"théori\" + 0.006*\"southern\" + 0.006*\"exampl\" + 0.006*\"servitud\" + 0.006*\"measur\" + 0.006*\"utopian\"\n", + "2019-01-31 01:40:43,271 : INFO : topic diff=0.003394, rho=0.020182\n", + "2019-01-31 01:40:43,421 : INFO : PROGRESS: pass 0, at document #4912000/4922894\n", + "2019-01-31 01:40:44,767 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:45,033 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.013*\"pakistan\" + 0.013*\"islam\" + 0.012*\"anglo\" + 0.011*\"televis\" + 0.011*\"khalsa\" + 0.011*\"affection\" + 0.010*\"muskoge\" + 0.010*\"tajikistan\"\n", + "2019-01-31 01:40:45,034 : INFO : topic #6 (0.020): 0.068*\"fewer\" + 0.024*\"epiru\" + 0.021*\"septemb\" + 
0.018*\"teacher\" + 0.014*\"stake\" + 0.012*\"rodríguez\" + 0.012*\"proclaim\" + 0.010*\"direct\" + 0.010*\"movi\" + 0.010*\"acrimoni\"\n", + "2019-01-31 01:40:45,035 : INFO : topic #41 (0.020): 0.044*\"citi\" + 0.025*\"palmer\" + 0.019*\"new\" + 0.018*\"strategist\" + 0.013*\"center\" + 0.013*\"open\" + 0.012*\"includ\" + 0.011*\"lobe\" + 0.011*\"dai\" + 0.009*\"highli\"\n", + "2019-01-31 01:40:45,036 : INFO : topic #16 (0.020): 0.055*\"king\" + 0.031*\"priest\" + 0.020*\"duke\" + 0.019*\"rotterdam\" + 0.018*\"idiosyncrat\" + 0.017*\"quarterli\" + 0.017*\"grammat\" + 0.016*\"kingdom\" + 0.014*\"portugues\" + 0.012*\"princ\"\n", + "2019-01-31 01:40:45,037 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"popolo\" + 0.042*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"multitud\" + 0.022*\"adulthood\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:40:45,043 : INFO : topic diff=0.003446, rho=0.020178\n", + "2019-01-31 01:40:45,202 : INFO : PROGRESS: pass 0, at document #4914000/4922894\n", + "2019-01-31 01:40:46,585 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:46,851 : INFO : topic #30 (0.020): 0.036*\"leagu\" + 0.034*\"cleveland\" + 0.032*\"place\" + 0.028*\"taxpay\" + 0.024*\"scientist\" + 0.023*\"crete\" + 0.021*\"folei\" + 0.017*\"goal\" + 0.015*\"martin\" + 0.013*\"schmitz\"\n", + "2019-01-31 01:40:46,852 : INFO : topic #43 (0.020): 0.066*\"elect\" + 0.054*\"parti\" + 0.025*\"voluntari\" + 0.023*\"democrat\" + 0.019*\"member\" + 0.016*\"polici\" + 0.015*\"republ\" + 0.014*\"bypass\" + 0.013*\"report\" + 0.013*\"liber\"\n", + "2019-01-31 01:40:46,853 : INFO : topic #44 (0.020): 0.031*\"rooftop\" + 0.027*\"final\" + 0.023*\"wife\" + 0.020*\"tourist\" + 0.018*\"champion\" + 0.015*\"martin\" + 0.014*\"chamber\" + 0.014*\"taxpay\" + 0.013*\"tiepolo\" + 0.013*\"open\"\n", + "2019-01-31 01:40:46,854 : INFO : topic #45 (0.020): 0.048*\"arsen\" + 0.031*\"museo\" + 
0.030*\"jpg\" + 0.028*\"fifteenth\" + 0.022*\"pain\" + 0.020*\"illicit\" + 0.017*\"artist\" + 0.016*\"exhaust\" + 0.016*\"gai\" + 0.016*\"colder\"\n", + "2019-01-31 01:40:46,855 : INFO : topic #47 (0.020): 0.065*\"muscl\" + 0.032*\"perceptu\" + 0.021*\"theater\" + 0.018*\"place\" + 0.018*\"compos\" + 0.015*\"damn\" + 0.015*\"orchestr\" + 0.013*\"olympo\" + 0.013*\"physician\" + 0.012*\"word\"\n", + "2019-01-31 01:40:46,861 : INFO : topic diff=0.002499, rho=0.020174\n", + "2019-01-31 01:40:47,015 : INFO : PROGRESS: pass 0, at document #4916000/4922894\n", + "2019-01-31 01:40:48,378 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:48,644 : INFO : topic #17 (0.020): 0.079*\"church\" + 0.024*\"cathol\" + 0.022*\"christian\" + 0.021*\"bishop\" + 0.017*\"sail\" + 0.014*\"retroflex\" + 0.010*\"relationship\" + 0.010*\"cathedr\" + 0.009*\"historiographi\" + 0.009*\"poll\"\n", + "2019-01-31 01:40:48,645 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:48,646 : INFO : topic #49 (0.020): 0.043*\"india\" + 0.031*\"incumb\" + 0.014*\"pakistan\" + 0.013*\"islam\" + 0.012*\"televis\" + 0.012*\"anglo\" + 0.011*\"sri\" + 0.011*\"tajikistan\" + 0.011*\"khalsa\" + 0.010*\"muskoge\"\n", + "2019-01-31 01:40:48,647 : INFO : topic #32 (0.020): 0.051*\"district\" + 0.046*\"popolo\" + 0.043*\"vigour\" + 0.036*\"tortur\" + 0.033*\"cotton\" + 0.022*\"adulthood\" + 0.022*\"multitud\" + 0.021*\"area\" + 0.019*\"cede\" + 0.018*\"citi\"\n", + "2019-01-31 01:40:48,648 : INFO : topic #3 (0.020): 0.032*\"present\" + 0.025*\"nation\" + 0.025*\"offic\" + 0.024*\"govern\" + 0.023*\"minist\" + 0.022*\"member\" + 0.018*\"serv\" + 0.018*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:40:48,654 : INFO : topic diff=0.003276, rho=0.020170\n", + "2019-01-31 
01:40:48,817 : INFO : PROGRESS: pass 0, at document #4918000/4922894\n", + "2019-01-31 01:40:50,225 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:50,491 : INFO : topic #37 (0.020): 0.012*\"charact\" + 0.012*\"septemb\" + 0.010*\"man\" + 0.010*\"anim\" + 0.008*\"comic\" + 0.007*\"appear\" + 0.007*\"fusiform\" + 0.007*\"storag\" + 0.007*\"workplac\" + 0.006*\"black\"\n", + "2019-01-31 01:40:50,492 : INFO : topic #13 (0.020): 0.026*\"australia\" + 0.026*\"london\" + 0.025*\"sourc\" + 0.024*\"new\" + 0.023*\"england\" + 0.022*\"australian\" + 0.020*\"british\" + 0.018*\"ireland\" + 0.014*\"youth\" + 0.014*\"weekli\"\n", + "2019-01-31 01:40:50,494 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:40:50,495 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.008*\"group\" + 0.007*\"woman\" + 0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:40:50,496 : INFO : topic #29 (0.020): 0.032*\"companhia\" + 0.013*\"busi\" + 0.012*\"million\" + 0.012*\"market\" + 0.012*\"produc\" + 0.010*\"industri\" + 0.010*\"bank\" + 0.009*\"manag\" + 0.009*\"yawn\" + 0.007*\"oper\"\n", + "2019-01-31 01:40:50,502 : INFO : topic diff=0.003675, rho=0.020166\n", + "2019-01-31 01:40:53,222 : INFO : -11.803 per-word bound, 3573.1 perplexity estimate based on a held-out corpus of 2000 documents with 581976 words\n", + "2019-01-31 01:40:53,222 : INFO : PROGRESS: pass 0, at document #4920000/4922894\n", + "2019-01-31 01:40:54,616 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:54,883 : INFO : topic #27 (0.020): 0.075*\"questionnair\" + 0.020*\"candid\" + 0.017*\"taxpay\" + 0.013*\"fool\" + 0.013*\"tornado\" + 
0.012*\"driver\" + 0.012*\"find\" + 0.012*\"ret\" + 0.011*\"squatter\" + 0.010*\"théori\"\n", + "2019-01-31 01:40:54,883 : INFO : topic #48 (0.020): 0.077*\"octob\" + 0.076*\"march\" + 0.076*\"sens\" + 0.068*\"januari\" + 0.068*\"notion\" + 0.067*\"decatur\" + 0.067*\"juli\" + 0.066*\"august\" + 0.065*\"april\" + 0.063*\"judici\"\n", + "2019-01-31 01:40:54,884 : INFO : topic #1 (0.020): 0.052*\"china\" + 0.043*\"chilton\" + 0.025*\"kong\" + 0.025*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:40:54,885 : INFO : topic #3 (0.020): 0.031*\"present\" + 0.026*\"offic\" + 0.025*\"nation\" + 0.023*\"govern\" + 0.023*\"minist\" + 0.022*\"member\" + 0.019*\"serv\" + 0.018*\"start\" + 0.015*\"gener\" + 0.014*\"chickasaw\"\n", + "2019-01-31 01:40:54,886 : INFO : topic #25 (0.020): 0.031*\"ring\" + 0.019*\"area\" + 0.017*\"lagrang\" + 0.017*\"warmth\" + 0.015*\"mount\" + 0.010*\"north\" + 0.009*\"sourc\" + 0.009*\"land\" + 0.008*\"palmer\" + 0.008*\"foam\"\n", + "2019-01-31 01:40:54,892 : INFO : topic diff=0.003423, rho=0.020162\n", + "2019-01-31 01:40:55,051 : INFO : PROGRESS: pass 0, at document #4922000/4922894\n", + "2019-01-31 01:40:56,425 : INFO : merging changes from 2000 documents into a model of 4922894 documents\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:40:56,692 : INFO : topic #5 (0.020): 0.038*\"abroad\" + 0.028*\"son\" + 0.027*\"rel\" + 0.026*\"reconstruct\" + 0.021*\"band\" + 0.016*\"muscl\" + 0.016*\"simultan\" + 0.014*\"charcoal\" + 0.013*\"toyota\" + 0.010*\"vocabulari\"\n", + "2019-01-31 01:40:56,693 : INFO : topic #0 (0.020): 0.061*\"statewid\" + 0.038*\"line\" + 0.030*\"rivièr\" + 0.030*\"raid\" + 0.025*\"rosenwald\" + 0.020*\"airmen\" + 0.017*\"traceabl\" + 0.017*\"serv\" + 0.013*\"briarwood\" + 0.013*\"oper\"\n", + "2019-01-31 01:40:56,694 : INFO : topic #24 (0.020): 0.041*\"book\" + 0.036*\"publicis\" + 
0.024*\"word\" + 0.020*\"new\" + 0.014*\"edit\" + 0.014*\"presid\" + 0.011*\"magazin\" + 0.011*\"author\" + 0.011*\"nicola\" + 0.011*\"storag\"\n", + "2019-01-31 01:40:56,695 : INFO : topic #48 (0.020): 0.077*\"octob\" + 0.076*\"march\" + 0.075*\"sens\" + 0.067*\"januari\" + 0.067*\"notion\" + 0.067*\"decatur\" + 0.066*\"juli\" + 0.066*\"august\" + 0.065*\"april\" + 0.063*\"judici\"\n", + "2019-01-31 01:40:56,696 : INFO : topic #38 (0.020): 0.022*\"walter\" + 0.011*\"aza\" + 0.009*\"forc\" + 0.008*\"teufel\" + 0.008*\"battalion\" + 0.008*\"till\" + 0.007*\"empath\" + 0.007*\"armi\" + 0.006*\"militari\" + 0.006*\"govern\"\n", + "2019-01-31 01:40:56,702 : INFO : topic diff=0.003322, rho=0.020158\n", + "2019-01-31 01:40:58,121 : INFO : -11.497 per-word bound, 2890.3 perplexity estimate based on a held-out corpus of 894 documents with 240967 words\n", + "2019-01-31 01:40:58,121 : INFO : PROGRESS: pass 0, at document #4922894/4922894\n", + "2019-01-31 01:40:58,868 : INFO : merging changes from 894 documents into a model of 4922894 documents\n", + "2019-01-31 01:40:59,135 : INFO : topic #11 (0.020): 0.023*\"john\" + 0.011*\"will\" + 0.011*\"david\" + 0.011*\"jame\" + 0.010*\"rival\" + 0.009*\"mexican–american\" + 0.008*\"slur\" + 0.008*\"georg\" + 0.008*\"paul\" + 0.008*\"rhyme\"\n", + "2019-01-31 01:40:59,136 : INFO : topic #18 (0.020): 0.011*\"théori\" + 0.007*\"later\" + 0.006*\"sack\" + 0.006*\"dai\" + 0.005*\"kill\" + 0.005*\"like\" + 0.005*\"retrospect\" + 0.005*\"end\" + 0.004*\"call\" + 0.004*\"help\"\n", + "2019-01-31 01:40:59,137 : INFO : topic #40 (0.020): 0.087*\"unit\" + 0.023*\"schuster\" + 0.022*\"institut\" + 0.021*\"collector\" + 0.020*\"requir\" + 0.019*\"student\" + 0.014*\"professor\" + 0.012*\"word\" + 0.011*\"governor\" + 0.011*\"degre\"\n", + "2019-01-31 01:40:59,138 : INFO : topic #15 (0.020): 0.011*\"small\" + 0.010*\"organ\" + 0.009*\"develop\" + 0.009*\"commun\" + 0.008*\"group\" + 0.008*\"peopl\" + 0.008*\"word\" + 0.007*\"woman\" + 
0.007*\"human\" + 0.006*\"summerhil\"\n", + "2019-01-31 01:40:59,139 : INFO : topic #1 (0.020): 0.053*\"china\" + 0.045*\"chilton\" + 0.026*\"kong\" + 0.026*\"hong\" + 0.021*\"korea\" + 0.019*\"korean\" + 0.016*\"leah\" + 0.015*\"sourc\" + 0.015*\"shirin\" + 0.014*\"kim\"\n", + "2019-01-31 01:40:59,145 : INFO : topic diff=0.003886, rho=0.020154\n", + "2019-01-31 01:40:59,155 : INFO : saving LdaState object under lda.model.state, separately None\n", + "2019-01-31 01:40:59,266 : INFO : saved lda.model.state\n", + "2019-01-31 01:40:59,325 : INFO : saving LdaModel object under lda.model, separately ['expElogbeta', 'sstats']\n", + "2019-01-31 01:40:59,326 : INFO : not storing attribute dispatcher\n", + "2019-01-31 01:40:59,327 : INFO : not storing attribute state\n", + "2019-01-31 01:40:59,327 : INFO : storing np array 'expElogbeta' to lda.model.expElogbeta.npy\n", + "2019-01-31 01:40:59,353 : INFO : not storing attribute id2word\n", + "2019-01-31 01:40:59,356 : INFO : saved lda.model\n" ] } ], "source": [ - "for row_idx, row in tm_metrics.iterrows():\n", - " print('='*20)\n", - " print(row['model'])\n", - " print('='*20)\n", - " print()\n", - " for topic_idx, tokens in row['topics']:\n", - " print('Topic: {}'.format(topic_idx))\n", - " print(tokens)\n", - " print()\n", - " print()" + "row = dict()\n", + "row['model'] = 'lda'\n", + "row['train_time'], row['mean_ram'], row['max_ram'], lda = get_train_time_and_ram(\n", + " lambda: LdaModel(**params),\n", + " 'lda',\n", + ")\n", + "lda.save('lda.model')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "As we can see, NMF can be significantly faster than LDA without sacrificing quality of topics too much (or not sacrificing at all)\n", + "### Load LDA and store metrics" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2019-01-31 01:40:59,377 : INFO : loading LdaModel object from lda.model\n", + 
"2019-01-31 01:40:59,379 : INFO : loading expElogbeta from lda.model.expElogbeta.npy with mmap=None\n", + "2019-01-31 01:40:59,383 : INFO : setting ignored attribute dispatcher to None\n", + "2019-01-31 01:40:59,384 : INFO : setting ignored attribute state to None\n", + "2019-01-31 01:40:59,384 : INFO : setting ignored attribute id2word to None\n", + "2019-01-31 01:40:59,385 : INFO : loaded lda.model\n", + "2019-01-31 01:40:59,385 : INFO : loading LdaState object from lda.model.state\n", + "2019-01-31 01:40:59,479 : INFO : loaded lda.model.state\n", + "/home/anotherbugmaster/gensim/gensim/matutils.py:503: FutureWarning: arrays to stack must be passed as a \"sequence\" type such as list or tuple. Support for non-sequence iterables such as generators is deprecated as of NumPy 1.16 and will raise an error in the future.\n", + " result = np.column_stack(sparse2full(doc, num_terms) for doc in corpus)\n", + "2019-01-31 01:41:07,761 : INFO : CorpusAccumulator accumulated stats from 1000 documents\n", + "2019-01-31 01:41:07,871 : INFO : CorpusAccumulator accumulated stats from 2000 documents\n" + ] + } + ], + "source": [ + "lda = LdaModel.load('lda.model')\n", + "row.update(get_tm_metrics(lda, test_corpus))\n", + "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Train Sklearn NMF and store metrics" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['sklearn_nmf.joblib']" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Normalize the input corpus to pass to sklearn\n", + "train_csc.data /= np.repeat(np.array(train_csc.sum(axis=0)), train_csc.getnnz(axis=0))\n", "\n", - "Moreover, NMF can be very flexible on RAM usage due to sparsity option, which leaves only small amount of elements in inner matrices." 
+ "row = dict()\n", + "row['model'] = 'sklearn_nmf'\n", + "sklearn_nmf = SklearnNmf(n_components=50, tol=1e-2, random_state=42)\n", + "row['train_time'], row['mean_ram'], row['max_ram'], sklearn_nmf = get_train_time_and_ram(\n", + " lambda: sklearn_nmf.fit(train_csc.T),\n", + " 'slearn_nmf',\n", + ")\n", + "\n", + "joblib.dump(sklearn_nmf, 'sklearn_nmf.joblib')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Load Sklearn NMF and store metrics" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [], + "source": [ + "sklearn_nmf = joblib.load('sklearn_nmf.joblib')\n", + "row.update(get_sklearn_metrics(\n", + " sklearn_nmf, test_csc.toarray(),\n", + "))\n", + "tm_metrics = tm_metrics.append(pd.Series(row), ignore_index=True)" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 21, "metadata": {}, "outputs": [], - "source": [] + "source": [ + "tm_metrics.replace(np.nan, '-', inplace=True)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Results" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
coherencel2_normmax_rammean_rammodelperplexitytrain_time
0-2.90777.3380008587 MB8553.0 MBgensim_nmf3817.23900000:24:16
1-2.52867.3648008773 MB8773.0 MBlda4701.97600001:25:59
2-6.97758317238 MB11675.0 MBsklearn_nmf4437.41731500:40:41
\n", + "
" + ], + "text/plain": [ + " coherence l2_norm max_ram mean_ram model perplexity \\\n", + "0 -2.9077 7.338000 8587 MB 8553.0 MB gensim_nmf 3817.239000 \n", + "1 -2.5286 7.364800 8773 MB 8773.0 MB lda 4701.976000 \n", + "2 - 6.977583 17238 MB 11675.0 MB sklearn_nmf 4437.417315 \n", + "\n", + " train_time \n", + "0 00:24:16 \n", + "1 01:25:59 \n", + "2 00:40:41 " + ] + }, + "execution_count": 22, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "tm_metrics" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "As we can see, NMF can be significantly faster than LDA without sacrificing quality of topics too much (or not sacrificing at all)\n", + "\n", + "Moreover, NMF can be very flexible on RAM usage due to sparsity option, which leaves only small amount of elements in inner matrices." + ] } ], "metadata": { @@ -1304,7 +23530,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.7.2" + "version": "3.5.2" } }, "nbformat": 4, diff --git a/docs/src/apiref.rst b/docs/src/apiref.rst index c4f31f7f28..ae345e22bd 100644 --- a/docs/src/apiref.rst +++ b/docs/src/apiref.rst @@ -47,6 +47,7 @@ Modules: models/keyedvectors models/doc2vec models/fasttext + models/_fasttext_bin models/phrases models/poincare models/coherencemodel diff --git a/docs/src/conf.py b/docs/src/conf.py index 28da8af97e..001b357a9a 100644 --- a/docs/src/conf.py +++ b/docs/src/conf.py @@ -57,7 +57,7 @@ # The short X.Y version. version = '3.7' # The full version, including alpha/beta/rc tags. -release = '3.7.0' +release = '3.7.1' # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. 
diff --git a/docs/src/models/_fasttext_bin.rst b/docs/src/models/_fasttext_bin.rst new file mode 100644 index 0000000000..eb9a0ad950 --- /dev/null +++ b/docs/src/models/_fasttext_bin.rst @@ -0,0 +1,10 @@ +:mod:`models._fasttext_bin` -- Facebook I/O +=========================================== + +.. automodule:: gensim.models._fasttext_bin + :synopsis: Facebook I/O + :members: + :inherited-members: + :special-members: __getitem__ + :undoc-members: + :show-inheritance: diff --git a/docs/src/tut1.rst b/docs/src/tut1.rst index 992858ffad..394cf113c1 100644 --- a/docs/src/tut1.rst +++ b/docs/src/tut1.rst @@ -5,7 +5,12 @@ Corpora and Vector Spaces This tutorial is available as a Jupyter Notebook `here `_. -Don't forget to set +Or run this notebook online (no installation required) via the Binder project: + +.. image:: https://mybinder.org/badge_logo.svg + :target: https://mybinder.org/v2/gh/RaRe-Technologies/gensim/master?filepath=%2Fdocs%2Fnotebooks%2FCorpora_and_Vector_Spaces.ipynb + +| Don't forget to set >>> import logging >>> logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.INFO) diff --git a/docs/src/tutorial.rst b/docs/src/tutorial.rst index 3ec9631153..a66d7dbac3 100644 --- a/docs/src/tutorial.rst +++ b/docs/src/tutorial.rst @@ -30,6 +30,11 @@ priority levels; to activate logging (this is optional), run >>> import logging >>> logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.INFO) +Many of the topics in these tutorials are also presented in Jupyter notebooks, which can be run in your browser via the Binder project (no installation required) by clicking here: + +.. image:: https://mybinder.org/badge_logo.svg + :target: https://mybinder.org/v2/gh/RaRe-Technologies/gensim/master?filepath=%2Fdocs%2Fnotebooks + .. 
_first-example: diff --git a/gensim/__init__.py b/gensim/__init__.py index 6499a59e97..58418001bf 100644 --- a/gensim/__init__.py +++ b/gensim/__init__.py @@ -5,7 +5,7 @@ from gensim import parsing, corpora, matutils, interfaces, models, similarities, summarization, utils # noqa:F401 import logging -__version__ = '3.7.0' +__version__ = '3.7.1' logger = logging.getLogger('gensim') diff --git a/gensim/_matutils.c b/gensim/_matutils.c index 52d56d63b9..358dfcc7ea 100644 --- a/gensim/_matutils.c +++ b/gensim/_matutils.c @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. #else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 1 #include #ifndef offsetof @@ -398,7 +398,7 @@ typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -421,7 +421,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? 
PyDict_New() : _PyDict_NewPresized(n)) #else @@ -959,7 +959,7 @@ typedef struct { } __Pyx_BufFmt_Context; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. * * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -968,7 +968,7 @@ typedef struct { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -977,7 +977,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -986,7 +986,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -995,7 +995,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 uint8_t # 
<<<<<<<<<<<<<< @@ -1004,7 +1004,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -1013,7 +1013,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -1022,7 +1022,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -1031,7 +1031,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -1040,7 +1040,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 
* * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -1049,7 +1049,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -1058,7 +1058,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -1067,7 +1067,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -1076,7 +1076,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -1085,7 +1085,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -1094,7 +1094,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -1103,7 +1103,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1112,7 +1112,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1121,7 +1121,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1130,7 +1130,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef 
npy_double __pyx_t_5numpy_float_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1139,7 +1139,7 @@ typedef npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1178,7 +1178,7 @@ struct __pyx_MemviewEnum_obj; struct __pyx_memoryview_obj; struct __pyx_memoryviewslice_obj; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1187,7 +1187,7 @@ struct __pyx_memoryviewslice_obj; */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1196,7 +1196,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # 
<<<<<<<<<<<<<< @@ -1205,7 +1205,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -6142,7 +6142,7 @@ static CYTHON_INLINE double __pyx_fuse_1__pyx_f_6gensim_9_matutils__digamma(doub return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -6191,7 +6191,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -6200,7 +6200,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -6209,7 +6209,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, 
P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -6218,7 +6218,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6232,7 +6232,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -6243,7 +6243,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6252,7 +6252,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -6265,7 +6265,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6274,7 +6274,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6288,7 +6288,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -6299,7 +6299,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; 
__pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6308,7 +6308,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -6321,7 +6321,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6330,7 +6330,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -6339,7 +6339,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->buf = 
PyArray_DATA(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -6348,7 +6348,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6358,7 +6358,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -6367,7 +6367,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -6376,7 +6376,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -6388,7 +6388,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -6397,7 +6397,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -6407,7 +6407,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6417,7 +6417,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -6427,7 +6427,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -6438,7 +6438,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -6447,7 +6447,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * 
info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -6456,7 +6456,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -6465,7 +6465,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< @@ -6474,7 +6474,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_f = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< @@ -6487,7 +6487,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -6500,7 +6500,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); 
__pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -6510,7 +6510,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -6520,7 +6520,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6540,7 +6540,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -6557,7 +6557,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6566,7 +6566,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -6579,7 +6579,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6588,7 +6588,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -6601,7 +6601,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UBYTE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< @@ -6612,7 +6612,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_SHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< @@ -6623,7 +6623,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_USHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< @@ -6634,7 +6634,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_INT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< @@ -6645,7 +6645,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UINT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< @@ -6656,7 +6656,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< @@ -6667,7 +6667,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< @@ -6678,7 +6678,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< @@ -6689,7 +6689,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< 
@@ -6700,7 +6700,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_FLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< @@ -6711,7 +6711,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_DOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< @@ -6722,7 +6722,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< @@ -6733,7 +6733,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CFLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< @@ -6744,7 +6744,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CDOUBLE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< @@ -6755,7 +6755,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CLONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< @@ -6766,7 +6766,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_OBJECT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< @@ -6777,7 +6777,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; default: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -6798,7 +6798,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -6807,7 +6807,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -6817,7 +6817,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -6826,7 +6826,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -6836,7 +6836,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment 
# <<<<<<<<<<<<<< @@ -6845,7 +6845,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -6854,7 +6854,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< @@ -6864,7 +6864,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) __pyx_v_f = __pyx_t_9; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -6874,7 +6874,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * 
# experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -6906,7 +6906,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -6930,7 +6930,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -6940,7 +6940,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -6949,7 +6949,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def 
__releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -6958,7 +6958,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6968,7 +6968,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -6977,7 +6977,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6986,7 +6986,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -6998,7 +6998,7 @@ static void 
__pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -7012,7 +7012,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -7026,7 +7026,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -7045,7 +7045,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -7059,7 +7059,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -7073,7 +7073,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -7092,7 +7092,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -7106,7 +7106,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -7120,7 +7120,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -7139,7 +7139,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -7153,7 +7153,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -7167,7 +7167,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -7186,7 +7186,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, 
c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -7200,7 +7200,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -7214,7 +7214,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -7233,7 +7233,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -7247,7 +7247,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ 
-7257,7 +7257,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -7269,7 +7269,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -7278,7 +7278,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -7292,7 +7292,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -7307,7 +7307,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -7336,7 +7336,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -7345,7 +7345,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -7354,7 +7354,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -7377,7 +7377,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -7394,7 +7394,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -7429,7 +7429,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -7446,7 +7446,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -7459,7 +7459,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 856, __pyx_L1_error) - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -7468,7 +7468,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7488,7 +7488,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -7505,7 +7505,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7514,7 +7514,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -7527,7 +7527,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 860, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7536,7 +7536,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -7552,7 +7552,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -7561,7 +7561,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -7570,7 +7570,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -7581,7 +7581,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -7591,7 +7591,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -7601,7 +7601,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = 
child.type_num # <<<<<<<<<<<<<< @@ -7613,7 +7613,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -7623,7 +7623,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -7636,7 +7636,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __PYX_ERR(1, 880, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -7645,7 +7645,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< @@ -7663,7 +7663,7 @@ static CYTHON_INLINE char 
*__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< @@ -7681,7 +7681,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< @@ -7699,7 +7699,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< @@ -7717,7 +7717,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< @@ -7735,7 +7735,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< @@ -7753,7 +7753,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< @@ -7771,7 +7771,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< @@ -7789,7 +7789,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< @@ -7807,7 +7807,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< @@ -7825,7 +7825,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< @@ -7843,7 +7843,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< @@ -7861,7 +7861,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< @@ -7879,7 +7879,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == 
NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< @@ -7899,7 +7899,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< @@ -7919,7 +7919,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< @@ -7939,7 +7939,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< @@ -7957,7 +7957,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -7976,7 +7976,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L15:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -7985,7 +7985,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -7995,7 +7995,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -8008,7 +8008,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L13:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -8018,7 +8018,7 @@ static 
CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -8028,7 +8028,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -8053,7 +8053,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -8065,7 +8065,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 * * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! 
# <<<<<<<<<<<<<< @@ -8074,7 +8074,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ Py_INCREF(__pyx_v_base); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< @@ -8083,7 +8083,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -8095,7 +8095,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -8110,7 +8110,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< @@ -8119,7 +8119,7 @@ static 
CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -8129,7 +8129,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_t_1 = ((__pyx_v_base == NULL) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 * base = PyArray_BASE(arr) * if base is NULL: * return None # <<<<<<<<<<<<<< @@ -8140,7 +8140,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -8149,7 +8149,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 * if base is NULL: * return None * return base # <<<<<<<<<<<<<< @@ -8161,7 +8161,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = ((PyObject *)__pyx_v_base); goto __pyx_L0; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -8176,7 +8176,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -8197,7 +8197,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8213,7 +8213,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< @@ -8222,7 +8222,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { */ __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8236,7 +8236,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -8251,7 +8251,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -8267,7 +8267,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8282,7 +8282,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -8305,7 +8305,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -8326,7 +8326,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8342,7 +8342,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() 
except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -8351,7 +8351,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8365,7 +8365,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -8380,7 +8380,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -8396,7 +8396,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8411,7 +8411,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -8434,7 +8434,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -8455,7 +8455,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8471,7 +8471,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -8480,7 +8480,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8494,7 +8494,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -8508,7 +8508,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -8522,7 +8522,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8537,7 +8537,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -12127,8 +12127,8 @@ static PyObject *__pyx_memoryview_is_slice(struct __pyx_memoryview_obj *__pyx_v_ goto 
__pyx_L9_try_end; __pyx_L4_error:; __Pyx_XDECREF(__pyx_t_6); __pyx_t_6 = 0; - __Pyx_XDECREF(__pyx_t_8); __pyx_t_8 = 0; __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_XDECREF(__pyx_t_8); __pyx_t_8 = 0; /* "View.MemoryView":432 * obj = memoryview(obj, self.flags & ~PyBUF_WRITABLE | PyBUF_ANY_CONTIGUOUS, @@ -12837,11 +12837,11 @@ static PyObject *__pyx_memoryview_convert_item_to_object(struct __pyx_memoryview goto __pyx_L6_except_return; } __pyx_L3_error:; - __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; __Pyx_XDECREF(__pyx_t_6); __pyx_t_6 = 0; + __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; __Pyx_XDECREF(__pyx_t_9); __pyx_t_9 = 0; - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; - __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; /* "View.MemoryView":490 * try: @@ -22230,7 +22230,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__6); __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -22241,7 +22241,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__7); __Pyx_GIVEREF(__pyx_tuple__7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -22252,7 +22252,7 @@ static CYTHON_SMALL_CODE int 
__Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__8); __Pyx_GIVEREF(__pyx_tuple__8); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -22263,7 +22263,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__9); __Pyx_GIVEREF(__pyx_tuple__9); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -22274,7 +22274,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__10); __Pyx_GIVEREF(__pyx_tuple__10); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -22285,7 +22285,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__11); __Pyx_GIVEREF(__pyx_tuple__11); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -22296,7 +22296,7 @@ static CYTHON_SMALL_CODE 
int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__12); __Pyx_GIVEREF(__pyx_tuple__12); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -27200,7 +27200,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { theta = 0; } else { r = -a.real; - theta = atan2f(0, -1); + theta = atan2f(0.0, -1.0); } } else { r = __Pyx_c_abs_float(a); @@ -27355,7 +27355,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { theta = 0; } else { r = -a.real; - theta = atan2(0, -1); + theta = atan2(0.0, -1.0); } } else { r = __Pyx_c_abs_double(a); diff --git a/gensim/corpora/_mmreader.c b/gensim/corpora/_mmreader.c index 03734e0f32..e8c98eccc3 100644 --- a/gensim/corpora/_mmreader.c +++ b/gensim/corpora/_mmreader.c @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. 
#else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -398,7 +398,7 @@ typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -421,7 +421,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? PyDict_New() : _PyDict_NewPresized(n)) #else @@ -2227,11 +2227,11 @@ static int __pyx_pf_6gensim_7corpora_9_mmreader_8MmReader___init__(struct __pyx_ __Pyx_XDECREF(__pyx_t_13); __pyx_t_13 = 0; goto __pyx_L18_try_end; __pyx_L13_error:; + __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; __Pyx_XDECREF(__pyx_t_14); __pyx_t_14 = 0; - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; __Pyx_XDECREF(__pyx_t_2); __pyx_t_2 = 0; - __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; __Pyx_XDECREF(__pyx_t_3); __pyx_t_3 = 0; + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; /* "gensim/corpora/_mmreader.pyx":70 * (self.input, header) @@ -2546,13 +2546,13 @@ static int __pyx_pf_6gensim_7corpora_9_mmreader_8MmReader___init__(struct __pyx_ __Pyx_XDECREF(__pyx_t_10); __pyx_t_10 = 0; goto __pyx_L12_try_end; __pyx_L7_error:; - __Pyx_XDECREF(__pyx_t_19); __pyx_t_19 = 0; + __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; __Pyx_XDECREF(__pyx_t_14); __pyx_t_14 = 0; - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; __Pyx_XDECREF(__pyx_t_18); __pyx_t_18 = 0; + __Pyx_XDECREF(__pyx_t_19); __pyx_t_19 = 0; __Pyx_XDECREF(__pyx_t_2); __pyx_t_2 = 0; - __Pyx_XDECREF(__pyx_t_1); 
__pyx_t_1 = 0; __Pyx_XDECREF(__pyx_t_3); __pyx_t_3 = 0; + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; /*except:*/ { __Pyx_AddTraceback("gensim.corpora._mmreader.MmReader.__init__", __pyx_clineno, __pyx_lineno, __pyx_filename); if (__Pyx_GetException(&__pyx_t_3, &__pyx_t_1, &__pyx_t_2) < 0) __PYX_ERR(0, 62, __pyx_L9_except_error) @@ -3784,13 +3784,13 @@ static PyObject *__pyx_gb_6gensim_7corpora_9_mmreader_8MmReader_10generator(__py __Pyx_XDECREF(__pyx_t_8); __pyx_t_8 = 0; goto __pyx_L13_try_end; __pyx_L8_error:; - __Pyx_XDECREF(__pyx_t_16); __pyx_t_16 = 0; - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; - __Pyx_XDECREF(__pyx_t_3); __pyx_t_3 = 0; __Pyx_XDECREF(__pyx_t_15); __pyx_t_15 = 0; + __Pyx_XDECREF(__pyx_t_16); __pyx_t_16 = 0; __Pyx_XDECREF(__pyx_t_18); __pyx_t_18 = 0; __Pyx_XDECREF(__pyx_t_2); __pyx_t_2 = 0; + __Pyx_XDECREF(__pyx_t_3); __pyx_t_3 = 0; + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; /*except:*/ { __Pyx_AddTraceback("gensim.corpora._mmreader.MmReader.__iter__", __pyx_clineno, __pyx_lineno, __pyx_filename); if (__Pyx_GetException(&__pyx_t_2, &__pyx_t_18, &__pyx_t_15) < 0) __PYX_ERR(0, 127, __pyx_L10_except_error) diff --git a/gensim/models/_fasttext_bin.py b/gensim/models/_fasttext_bin.py index 31d85c5074..d8d84131a3 100644 --- a/gensim/models/_fasttext_bin.py +++ b/gensim/models/_fasttext_bin.py @@ -1,10 +1,14 @@ # -*- coding: utf-8 -*- """Load models from the native binary format released by Facebook. +The main entry point is the :func:`~gensim.models._fasttext_bin.load` function. +It returns a :class:`~gensim.models._fasttext_bin.Model` namedtuple containing everything loaded from the binary. + Examples -------- Load a model from a binary file: + .. 
sourcecode:: pycon >>> from gensim.test.utils import datapath @@ -26,11 +30,14 @@ """ import collections +import io import logging import struct import numpy as np +_END_OF_WORD_MARKER = b'\x00' + logger = logging.getLogger(__name__) _FASTTEXT_FILEFORMAT_MAGIC = 793712314 @@ -79,6 +86,49 @@ def _yield_field_names(): _FIELD_NAMES = sorted(set(_yield_field_names())) Model = collections.namedtuple('Model', _FIELD_NAMES) +"""Holds data loaded from the Facebook binary. + +Parameters +---------- +dim : int + The dimensionality of the vectors. +ws : int + The window size. +epoch : int + The number of training epochs. +neg : int + If non-zero, indicates that the model uses negative sampling. +loss : int + If equal to 1, indicates that the model uses hierarchical sampling. +model : int + If equal to 2, indicates that the model uses skip-grams. +bucket : int + The number of buckets. +min_count : int + The threshold below which the model ignores terms. +t : float + The sample threshold. +minn : int + The minimum ngram length. +maxn : int + The maximum ngram length. +raw_vocab : collections.OrderedDict + A map from words (str) to their frequency (int). The order in the dict + corresponds to the order of the words in the Facebook binary. +nwords : int + The number of words. +vocab_size : int + The size of the vocabulary. +vectors_ngrams : numpy.array + This is a matrix that contains vectors learned by the model. + Each row corresponds to a vector. + The number of vectors is equal to the number of words plus the number of buckets. + The number of columns is equal to the vector dimensionality. +hidden_output : numpy.array + This is a matrix that contains the shallow neural network output. + This array has the same dimensions as vectors_ngrams. + May be None - in that case, it is impossible to continue training the model. 
+""" def _struct_unpack(fin, fmt): @@ -121,13 +171,22 @@ def _load_vocab(fin, new_format, encoding='utf-8'): raw_vocab = collections.OrderedDict() for i in range(vocab_size): - word_bytes = b'' + word_bytes = io.BytesIO() char_byte = fin.read(1) - # Read vocab word - while char_byte != b'\x00': - word_bytes += char_byte + + while char_byte != _END_OF_WORD_MARKER: + word_bytes.write(char_byte) char_byte = fin.read(1) - word = word_bytes.decode(encoding) + + word_bytes = word_bytes.getvalue() + try: + word = word_bytes.decode(encoding) + except UnicodeDecodeError: + word = word_bytes.decode(encoding, errors='ignore') + logger.error( + 'failed to decode invalid unicode bytes %r; ignoring invalid characters, using %r', + word_bytes, word + ) count, _ = _struct_unpack(fin, '@qb') raw_vocab[word] = count @@ -177,7 +236,7 @@ def _load_matrix(fin, new_format=True): return matrix -def load(fin, encoding='utf-8'): +def load(fin, encoding='utf-8', full_model=True): """Load a model from a binary stream. Parameters @@ -186,10 +245,13 @@ def load(fin, encoding='utf-8'): The readable binary stream. encoding : str, optional The encoding to use for decoding text + full_model : boolean, optional + If False, skips loading the hidden output matrix. This saves a fair bit + of CPU time and RAM, but prevents training continuation. Returns ------- - Model + :class:`~gensim.models._fasttext_bin.Model` The loaded model. 
""" @@ -209,10 +271,12 @@ def load(fin, encoding='utf-8'): vectors_ngrams = _load_matrix(fin, new_format=new_format) - hidden_output = _load_matrix(fin, new_format=new_format) - model.update(vectors_ngrams=vectors_ngrams, hidden_output=hidden_output) - - assert fin.read() == b'', 'expected to reach EOF' + if not full_model: + hidden_output = None + else: + hidden_output = _load_matrix(fin, new_format=new_format) + assert fin.read() == b'', 'expected to reach EOF' + model.update(vectors_ngrams=vectors_ngrams, hidden_output=hidden_output) model = {k: v for k, v in model.items() if k in _FIELD_NAMES} return Model(**model) diff --git a/gensim/models/_utils_any2vec.c b/gensim/models/_utils_any2vec.c index c42dd6ef33..c9709ad9be 100644 --- a/gensim/models/_utils_any2vec.c +++ b/gensim/models/_utils_any2vec.c @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. #else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -398,7 +398,7 @@ typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -421,7 +421,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? 
PyDict_New() : _PyDict_NewPresized(n)) #else @@ -608,6 +608,7 @@ static CYTHON_INLINE float __PYX_NAN() { #define __PYX_HAVE__gensim__models___utils_any2vec #define __PYX_HAVE_API__gensim__models___utils_any2vec /* Early includes */ +#include "stdint_wrapper.h" #include #include #include "numpy/arrayobject.h" @@ -843,11 +844,10 @@ static const char *__pyx_filename; static const char *__pyx_f[] = { "gensim/models/_utils_any2vec.pyx", "__init__.pxd", - "stringsource", "type.pxd", }; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. * * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -856,7 +856,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -865,7 +865,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -874,7 +874,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # 
<<<<<<<<<<<<<< @@ -883,7 +883,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 uint8_t # <<<<<<<<<<<<<< @@ -892,7 +892,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -901,7 +901,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -910,7 +910,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -919,7 +919,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef 
npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -928,7 +928,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 * * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -937,7 +937,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -946,7 +946,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -955,7 +955,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -964,7 +964,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -973,7 +973,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -982,7 +982,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -991,7 +991,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1000,7 +1000,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1009,7 +1009,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef 
npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1018,7 +1018,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef npy_double __pyx_t_5numpy_float_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1027,7 +1027,7 @@ typedef npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1061,9 +1061,8 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do /*--- Type declarations ---*/ -struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1072,7 +1071,7 @@ struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py; */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 +/* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1081,7 +1080,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1090,7 +1089,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -1099,19 +1098,6 @@ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; */ typedef npy_cdouble __pyx_t_5numpy_complex_t; -/* "cfunc.to_py":64 - * - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): # <<<<<<<<<<<<<< - * def wrap(object b): - * """wrap(b)""" - */ -struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py { - PyObject_HEAD - PyObject *(*__pyx_v_f)(PyObject *); -}; - - /* --- Runtime support code (head) --- */ /* Refnanny.proto */ #ifndef CYTHON_REFNANNY @@ -1186,6 +1172,16 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_GetAttrStr(PyObject* obj, PyObject /* GetBuiltinName.proto */ static PyObject *__Pyx_GetBuiltinName(PyObject *name); +/* ArgTypeTest.proto */ +#define __Pyx_ArgTypeTest(obj, type, none_allowed, name, exact)\ + ((likely((Py_TYPE(obj) == type) | (none_allowed && (obj == Py_None)))) ? 
1 :\ + __Pyx__ArgTypeTest(obj, type, name, exact)) +static int __Pyx__ArgTypeTest(PyObject *obj, PyTypeObject *type, const char *name, int exact); + +/* unicode_iter.proto */ +static CYTHON_INLINE int __Pyx_init_unicode_iteration( + PyObject* ustring, Py_ssize_t *length, void** data, int *kind); + /* UnicodeAsUCS4.proto */ static CYTHON_INLINE Py_UCS4 __Pyx_PyUnicode_AsPy_UCS4(PyObject*); @@ -1198,85 +1194,6 @@ static CYTHON_INLINE Py_UCS4 __Pyx_PyUnicode_AsPy_UCS4(PyObject*); #endif static long __Pyx__PyObject_Ord(PyObject* c); -/* GetModuleGlobalName.proto */ -#if CYTHON_USE_DICT_VERSIONS -#define __Pyx_GetModuleGlobalName(var, name) {\ - static PY_UINT64_T __pyx_dict_version = 0;\ - static PyObject *__pyx_dict_cached_value = NULL;\ - (var) = (likely(__pyx_dict_version == __PYX_GET_DICT_VERSION(__pyx_d))) ?\ - (likely(__pyx_dict_cached_value) ? __Pyx_NewRef(__pyx_dict_cached_value) : __Pyx_GetBuiltinName(name)) :\ - __Pyx__GetModuleGlobalName(name, &__pyx_dict_version, &__pyx_dict_cached_value);\ -} -#define __Pyx_GetModuleGlobalNameUncached(var, name) {\ - PY_UINT64_T __pyx_dict_version;\ - PyObject *__pyx_dict_cached_value;\ - (var) = __Pyx__GetModuleGlobalName(name, &__pyx_dict_version, &__pyx_dict_cached_value);\ -} -static PyObject *__Pyx__GetModuleGlobalName(PyObject *name, PY_UINT64_T *dict_version, PyObject **dict_cached_value); -#else -#define __Pyx_GetModuleGlobalName(var, name) (var) = __Pyx__GetModuleGlobalName(name) -#define __Pyx_GetModuleGlobalNameUncached(var, name) (var) = __Pyx__GetModuleGlobalName(name) -static CYTHON_INLINE PyObject *__Pyx__GetModuleGlobalName(PyObject *name); -#endif - -/* PyCFunctionFastCall.proto */ -#if CYTHON_FAST_PYCCALL -static CYTHON_INLINE PyObject *__Pyx_PyCFunction_FastCall(PyObject *func, PyObject **args, Py_ssize_t nargs); -#else -#define __Pyx_PyCFunction_FastCall(func, args, nargs) (assert(0), NULL) -#endif - -/* PyFunctionFastCall.proto */ -#if CYTHON_FAST_PYCALL -#define __Pyx_PyFunction_FastCall(func, args, 
nargs)\ - __Pyx_PyFunction_FastCallDict((func), (args), (nargs), NULL) -#if 1 || PY_VERSION_HEX < 0x030600B1 -static PyObject *__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, int nargs, PyObject *kwargs); -#else -#define __Pyx_PyFunction_FastCallDict(func, args, nargs, kwargs) _PyFunction_FastCallDict(func, args, nargs, kwargs) -#endif -#define __Pyx_BUILD_ASSERT_EXPR(cond)\ - (sizeof(char [1 - 2*!(cond)]) - 1) -#ifndef Py_MEMBER_SIZE -#define Py_MEMBER_SIZE(type, member) sizeof(((type *)0)->member) -#endif - static size_t __pyx_pyframe_localsplus_offset = 0; - #include "frameobject.h" - #define __Pxy_PyFrame_Initialize_Offsets()\ - ((void)__Pyx_BUILD_ASSERT_EXPR(sizeof(PyFrameObject) == offsetof(PyFrameObject, f_localsplus) + Py_MEMBER_SIZE(PyFrameObject, f_localsplus)),\ - (void)(__pyx_pyframe_localsplus_offset = ((size_t)PyFrame_Type.tp_basicsize) - Py_MEMBER_SIZE(PyFrameObject, f_localsplus))) - #define __Pyx_PyFrame_GetLocalsplus(frame)\ - (assert(__pyx_pyframe_localsplus_offset), (PyObject **)(((char *)(frame)) + __pyx_pyframe_localsplus_offset)) -#endif - -/* PyObjectCall.proto */ -#if CYTHON_COMPILING_IN_CPYTHON -static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg, PyObject *kw); -#else -#define __Pyx_PyObject_Call(func, arg, kw) PyObject_Call(func, arg, kw) -#endif - -/* PyObjectCall2Args.proto */ -static CYTHON_UNUSED PyObject* __Pyx_PyObject_Call2Args(PyObject* function, PyObject* arg1, PyObject* arg2); - -/* PyObjectCallMethO.proto */ -#if CYTHON_COMPILING_IN_CPYTHON -static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject *arg); -#endif - -/* PyObjectCallOneArg.proto */ -static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObject *arg); - -/* ArgTypeTest.proto */ -#define __Pyx_ArgTypeTest(obj, type, none_allowed, name, exact)\ - ((likely((Py_TYPE(obj) == type) | (none_allowed && (obj == Py_None)))) ? 
1 :\ - __Pyx__ArgTypeTest(obj, type, name, exact)) -static int __Pyx__ArgTypeTest(PyObject *obj, PyTypeObject *type, const char *name, int exact); - -/* unicode_iter.proto */ -static CYTHON_INLINE int __Pyx_init_unicode_iteration( - PyObject* ustring, Py_ssize_t *length, void** data, int *kind); - /* PyObjectFormatSimple.proto */ #if CYTHON_COMPILING_IN_PYPY #define __Pyx_PyObject_FormatSimple(s, f) (\ @@ -1306,6 +1223,13 @@ static CYTHON_INLINE int __Pyx_init_unicode_iteration( static PyObject* __Pyx_PyUnicode_Join(PyObject* value_tuple, Py_ssize_t value_count, Py_ssize_t result_ulength, Py_UCS4 max_char); +/* PyObjectCall.proto */ +#if CYTHON_COMPILING_IN_CPYTHON +static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg, PyObject *kw); +#else +#define __Pyx_PyObject_Call(func, arg, kw) PyObject_Call(func, arg, kw) +#endif + /* PyIntBinop.proto */ #if !CYTHON_COMPILING_IN_PYPY static PyObject* __Pyx_PyInt_AddObjC(PyObject *op1, PyObject *op2, long intval, int inplace); @@ -1347,6 +1271,47 @@ static int __Pyx_ParseOptionalKeywords(PyObject *kwds, PyObject **argnames[],\ PyObject *kwds2, PyObject *values[], Py_ssize_t num_pos_args,\ const char* function_name); +/* PyCFunctionFastCall.proto */ +#if CYTHON_FAST_PYCCALL +static CYTHON_INLINE PyObject *__Pyx_PyCFunction_FastCall(PyObject *func, PyObject **args, Py_ssize_t nargs); +#else +#define __Pyx_PyCFunction_FastCall(func, args, nargs) (assert(0), NULL) +#endif + +/* PyFunctionFastCall.proto */ +#if CYTHON_FAST_PYCALL +#define __Pyx_PyFunction_FastCall(func, args, nargs)\ + __Pyx_PyFunction_FastCallDict((func), (args), (nargs), NULL) +#if 1 || PY_VERSION_HEX < 0x030600B1 +static PyObject *__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, int nargs, PyObject *kwargs); +#else +#define __Pyx_PyFunction_FastCallDict(func, args, nargs, kwargs) _PyFunction_FastCallDict(func, args, nargs, kwargs) +#endif +#define __Pyx_BUILD_ASSERT_EXPR(cond)\ + (sizeof(char [1 - 2*!(cond)]) - 1) 
+#ifndef Py_MEMBER_SIZE +#define Py_MEMBER_SIZE(type, member) sizeof(((type *)0)->member) +#endif + static size_t __pyx_pyframe_localsplus_offset = 0; + #include "frameobject.h" + #define __Pxy_PyFrame_Initialize_Offsets()\ + ((void)__Pyx_BUILD_ASSERT_EXPR(sizeof(PyFrameObject) == offsetof(PyFrameObject, f_localsplus) + Py_MEMBER_SIZE(PyFrameObject, f_localsplus)),\ + (void)(__pyx_pyframe_localsplus_offset = ((size_t)PyFrame_Type.tp_basicsize) - Py_MEMBER_SIZE(PyFrameObject, f_localsplus))) + #define __Pyx_PyFrame_GetLocalsplus(frame)\ + (assert(__pyx_pyframe_localsplus_offset), (PyObject **)(((char *)(frame)) + __pyx_pyframe_localsplus_offset)) +#endif + +/* PyObjectCall2Args.proto */ +static CYTHON_UNUSED PyObject* __Pyx_PyObject_Call2Args(PyObject* function, PyObject* arg1, PyObject* arg2); + +/* PyObjectCallMethO.proto */ +#if CYTHON_COMPILING_IN_CPYTHON +static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject *arg); +#endif + +/* PyObjectCallOneArg.proto */ +static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObject *arg); + /* PyThreadStateGet.proto */ #if CYTHON_FAST_THREAD_STATE #define __Pyx_PyThreadState_declare PyThreadState *__pyx_tstate; @@ -1441,70 +1406,6 @@ static int __Pyx__GetException(PyThreadState *tstate, PyObject **type, PyObject static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb); #endif -/* FetchCommonType.proto */ -static PyTypeObject* __Pyx_FetchCommonType(PyTypeObject* type); - -/* CythonFunction.proto */ -#define __Pyx_CyFunction_USED 1 -#define __Pyx_CYFUNCTION_STATICMETHOD 0x01 -#define __Pyx_CYFUNCTION_CLASSMETHOD 0x02 -#define __Pyx_CYFUNCTION_CCLASS 0x04 -#define __Pyx_CyFunction_GetClosure(f)\ - (((__pyx_CyFunctionObject *) (f))->func_closure) -#define __Pyx_CyFunction_GetClassObj(f)\ - (((__pyx_CyFunctionObject *) (f))->func_classobj) -#define __Pyx_CyFunction_Defaults(type, f)\ - ((type *)(((__pyx_CyFunctionObject *) (f))->defaults)) -#define 
__Pyx_CyFunction_SetDefaultsGetter(f, g)\ - ((__pyx_CyFunctionObject *) (f))->defaults_getter = (g) -typedef struct { - PyCFunctionObject func; -#if PY_VERSION_HEX < 0x030500A0 - PyObject *func_weakreflist; -#endif - PyObject *func_dict; - PyObject *func_name; - PyObject *func_qualname; - PyObject *func_doc; - PyObject *func_globals; - PyObject *func_code; - PyObject *func_closure; - PyObject *func_classobj; - void *defaults; - int defaults_pyobjects; - int flags; - PyObject *defaults_tuple; - PyObject *defaults_kwdict; - PyObject *(*defaults_getter)(PyObject *); - PyObject *func_annotations; -} __pyx_CyFunctionObject; -static PyTypeObject *__pyx_CyFunctionType = 0; -#define __Pyx_CyFunction_Check(obj) (__Pyx_TypeCheck(obj, __pyx_CyFunctionType)) -#define __Pyx_CyFunction_NewEx(ml, flags, qualname, self, module, globals, code)\ - __Pyx_CyFunction_New(__pyx_CyFunctionType, ml, flags, qualname, self, module, globals, code) -static PyObject *__Pyx_CyFunction_New(PyTypeObject *, PyMethodDef *ml, - int flags, PyObject* qualname, - PyObject *self, - PyObject *module, PyObject *globals, - PyObject* code); -static CYTHON_INLINE void *__Pyx_CyFunction_InitDefaults(PyObject *m, - size_t size, - int pyobjects); -static CYTHON_INLINE void __Pyx_CyFunction_SetDefaultsTuple(PyObject *m, - PyObject *tuple); -static CYTHON_INLINE void __Pyx_CyFunction_SetDefaultsKwDict(PyObject *m, - PyObject *dict); -static CYTHON_INLINE void __Pyx_CyFunction_SetAnnotationsDict(PyObject *m, - PyObject *dict); -static int __pyx_CyFunction_init(void); - -/* PyObject_GenericGetAttrNoDict.proto */ -#if CYTHON_USE_TYPE_SLOTS && CYTHON_USE_PYTYPE_LOOKUP && PY_VERSION_HEX < 0x03070000 -static CYTHON_INLINE PyObject* __Pyx_PyObject_GenericGetAttrNoDict(PyObject* obj, PyObject* attr_name); -#else -#define __Pyx_PyObject_GenericGetAttrNoDict PyObject_GenericGetAttr -#endif - /* TypeImport.proto */ #ifndef __PYX_HAVE_RT_ImportType_proto #define __PYX_HAVE_RT_ImportType_proto @@ -1549,7 +1450,7 @@ static 
void __Pyx_AddTraceback(const char *funcname, int c_line, int py_line, const char *filename); /* CIntToPy.proto */ -static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value); +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_uint32_t(uint32_t value); /* CIntToPy.proto */ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_int(unsigned int value); @@ -1661,9 +1562,18 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES v /* CIntFromPy.proto */ static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *); +/* CIntFromPy.proto */ +static CYTHON_INLINE char __Pyx_PyInt_As_char(PyObject *); + +/* CIntFromPy.proto */ +static CYTHON_INLINE size_t __Pyx_PyInt_As_size_t(PyObject *); + /* CIntFromPy.proto */ static CYTHON_INLINE int __Pyx_PyInt_As_int(PyObject *); +/* CIntToPy.proto */ +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value); + /* CIntFromPy.proto */ static CYTHON_INLINE long __Pyx_PyInt_As_long(PyObject *); @@ -1717,13 +1627,12 @@ static PyTypeObject *__pyx_ptype_5numpy_ufunc = 0; static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *, char *, char *, int *); /*proto*/ /* Module declarations from 'gensim.models._utils_any2vec' */ -static PyTypeObject *__pyx_ptype___pyx_scope_struct____Pyx_CFunc_object____object___to_py = 0; -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec__byte_to_int_py3(PyObject *); /*proto*/ -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec__byte_to_int_py2(PyObject *); /*proto*/ -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash(PyObject *, int __pyx_skip_dispatch); /*proto*/ +static unsigned char __pyx_v_6gensim_6models_14_utils_any2vec__MB_MASK; +static unsigned char __pyx_v_6gensim_6models_14_utils_any2vec__MB_START; +static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash_bytes(PyObject *, int __pyx_skip_dispatch); /*proto*/ static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash_broken(PyObject 
*, int __pyx_skip_dispatch); /*proto*/ static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_compute_ngrams(PyObject *, unsigned int, unsigned int, int __pyx_skip_dispatch); /*proto*/ -static PyObject *__Pyx_CFunc_object____object___to_py(PyObject *(*)(PyObject *)); /*proto*/ +static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_compute_ngrams_bytes(PyObject *, unsigned int, unsigned int, int __pyx_skip_dispatch); /*proto*/ #define __Pyx_MODULE_NAME "gensim.models._utils_any2vec" extern int __pyx_module_is_main_gensim__models___utils_any2vec; int __pyx_module_is_main_gensim__models___utils_any2vec = 0; @@ -1734,32 +1643,27 @@ static PyObject *__pyx_builtin_ValueError; static PyObject *__pyx_builtin_RuntimeError; static PyObject *__pyx_builtin_ImportError; static const char __pyx_k_[] = "<"; -static const char __pyx_k_b[] = "b"; +static const char __pyx_k_s[] = "<%s>"; static const char __pyx_k__2[] = ">"; static const char __pyx_k_np[] = "np"; static const char __pyx_k_PY2[] = "PY2"; static const char __pyx_k_six[] = "six"; -static const char __pyx_k_int8[] = "int8"; static const char __pyx_k_main[] = "__main__"; static const char __pyx_k_name[] = "__name__"; static const char __pyx_k_test[] = "__test__"; static const char __pyx_k_word[] = "word"; -static const char __pyx_k_wrap[] = "wrap"; static const char __pyx_k_max_n[] = "max_n"; static const char __pyx_k_min_n[] = "min_n"; static const char __pyx_k_numpy[] = "numpy"; static const char __pyx_k_range[] = "range"; +static const char __pyx_k_utf_8[] = "utf-8"; +static const char __pyx_k_encode[] = "encode"; static const char __pyx_k_import[] = "__import__"; -static const char __pyx_k_uint32[] = "uint32"; static const char __pyx_k_ValueError[] = "ValueError"; static const char __pyx_k_ImportError[] = "ImportError"; -static const char __pyx_k_byte_to_int[] = "_byte_to_int"; -static const char __pyx_k_cfunc_to_py[] = "cfunc.to_py"; static const char __pyx_k_RuntimeError[] = "RuntimeError"; -static const 
char __pyx_k_stringsource[] = "stringsource"; static const char __pyx_k_cline_in_traceback[] = "cline_in_traceback"; static const char __pyx_k_ndarray_is_not_C_contiguous[] = "ndarray is not C contiguous"; -static const char __pyx_k_Pyx_CFunc_object____object___t[] = "__Pyx_CFunc_object____object___to_py..wrap"; static const char __pyx_k_numpy_core_multiarray_failed_to[] = "numpy.core.multiarray failed to import"; static const char __pyx_k_unknown_dtype_code_in_numpy_pxd[] = "unknown dtype code in numpy.pxd (%d)"; static const char __pyx_k_Format_string_allocated_too_shor[] = "Format string allocated too short, see comment in numpy.pxd"; @@ -1774,16 +1678,12 @@ static PyObject *__pyx_kp_u_Format_string_allocated_too_shor_2; static PyObject *__pyx_n_s_ImportError; static PyObject *__pyx_kp_u_Non_native_byte_order_not_suppor; static PyObject *__pyx_n_s_PY2; -static PyObject *__pyx_n_s_Pyx_CFunc_object____object___t; static PyObject *__pyx_n_s_RuntimeError; static PyObject *__pyx_n_s_ValueError; static PyObject *__pyx_kp_u__2; -static PyObject *__pyx_n_s_b; -static PyObject *__pyx_n_s_byte_to_int; -static PyObject *__pyx_n_s_cfunc_to_py; static PyObject *__pyx_n_s_cline_in_traceback; +static PyObject *__pyx_n_s_encode; static PyObject *__pyx_n_s_import; -static PyObject *__pyx_n_s_int8; static PyObject *__pyx_n_s_main; static PyObject *__pyx_n_s_max_n; static PyObject *__pyx_n_s_min_n; @@ -1795,23 +1695,20 @@ static PyObject *__pyx_n_s_numpy; static PyObject *__pyx_kp_s_numpy_core_multiarray_failed_to; static PyObject *__pyx_kp_s_numpy_core_umath_failed_to_impor; static PyObject *__pyx_n_s_range; +static PyObject *__pyx_kp_s_s; static PyObject *__pyx_n_s_six; -static PyObject *__pyx_kp_s_stringsource; static PyObject *__pyx_n_s_test; -static PyObject *__pyx_n_s_uint32; static PyObject *__pyx_kp_u_unknown_dtype_code_in_numpy_pxd; +static PyObject *__pyx_kp_s_utf_8; static PyObject *__pyx_n_s_word; -static PyObject *__pyx_n_s_wrap; -static PyObject 
*__pyx_pf_6gensim_6models_14_utils_any2vec_ft_hash(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_string); /* proto */ +static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_ft_hash_bytes(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_bytez); /* proto */ static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_2ft_hash_broken(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_string); /* proto */ static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_4compute_ngrams(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_word, unsigned int __pyx_v_min_n, unsigned int __pyx_v_max_n); /* proto */ +static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_6compute_ngrams_bytes(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_word, unsigned int __pyx_v_min_n, unsigned int __pyx_v_max_n); /* proto */ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags); /* proto */ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_self, Py_buffer *__pyx_v_info); /* proto */ -static PyObject *__pyx_pf_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_wrap(PyObject *__pyx_self, PyObject *__pyx_v_b); /* proto */ -static PyObject *__pyx_tp_new___pyx_scope_struct____Pyx_CFunc_object____object___to_py(PyTypeObject *t, PyObject *a, PyObject *k); /*proto*/ static PyObject *__pyx_int_0; static PyObject *__pyx_int_1; -static PyObject *__pyx_int_16777619; static PyObject *__pyx_tuple__3; static PyObject *__pyx_tuple__4; static PyObject *__pyx_tuple__5; @@ -1819,465 +1716,198 @@ static PyObject *__pyx_tuple__6; static PyObject *__pyx_tuple__7; static PyObject *__pyx_tuple__8; static PyObject *__pyx_tuple__9; -static PyObject *__pyx_tuple__10; -static PyObject *__pyx_codeobj__11; /* Late includes */ -/* "gensim/models/_utils_any2vec.pyx":15 - * +/* "gensim/models/_utils_any2vec.pyx":22 * - * cdef _byte_to_int_py3(b): # <<<<<<<<<<<<<< - * return b * + * cpdef 
ft_hash_bytes(bytes bytez): # <<<<<<<<<<<<<< + * """Calculate hash based on `bytez`. + * Reproduce `hash method from Facebook fastText implementation */ -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec__byte_to_int_py3(PyObject *__pyx_v_b) { +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash_bytes(PyObject *__pyx_self, PyObject *__pyx_v_bytez); /*proto*/ +static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash_bytes(PyObject *__pyx_v_bytez, CYTHON_UNUSED int __pyx_skip_dispatch) { + uint32_t __pyx_v_h; + char __pyx_v_b; PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations - __Pyx_RefNannySetupContext("_byte_to_int_py3", 0); + PyObject *__pyx_t_1 = NULL; + char *__pyx_t_2; + char *__pyx_t_3; + char *__pyx_t_4; + char *__pyx_t_5; + PyObject *__pyx_t_6 = NULL; + __Pyx_RefNannySetupContext("ft_hash_bytes", 0); + + /* "gensim/models/_utils_any2vec.pyx":38 + * + * """ + * cdef uint32_t h = 2166136261 # <<<<<<<<<<<<<< + * cdef char b + * + */ + __pyx_v_h = 0x811C9DC5; + + /* "gensim/models/_utils_any2vec.pyx":41 + * cdef char b + * + * for b in bytez: # <<<<<<<<<<<<<< + * h = h ^ (b) + * h = h * 16777619 + */ + if (unlikely(__pyx_v_bytez == Py_None)) { + PyErr_SetString(PyExc_TypeError, "'NoneType' is not iterable"); + __PYX_ERR(0, 41, __pyx_L1_error) + } + __Pyx_INCREF(__pyx_v_bytez); + __pyx_t_1 = __pyx_v_bytez; + __pyx_t_3 = PyBytes_AS_STRING(__pyx_t_1); + __pyx_t_4 = (__pyx_t_3 + PyBytes_GET_SIZE(__pyx_t_1)); + for (__pyx_t_5 = __pyx_t_3; __pyx_t_5 < __pyx_t_4; __pyx_t_5++) { + __pyx_t_2 = __pyx_t_5; + __pyx_v_b = (__pyx_t_2[0]); + + /* "gensim/models/_utils_any2vec.pyx":42 + * + * for b in bytez: + * h = h ^ (b) # <<<<<<<<<<<<<< + * h = h * 16777619 + * return h + */ + __pyx_v_h = (__pyx_v_h ^ ((uint32_t)((int8_t)__pyx_v_b))); + + /* "gensim/models/_utils_any2vec.pyx":43 + * for b in bytez: + * h = h ^ (b) + * h = h * 16777619 # <<<<<<<<<<<<<< + * return h + * + */ + __pyx_v_h = (__pyx_v_h * 0x1000193); + } + 
__Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/_utils_any2vec.pyx":16 + /* "gensim/models/_utils_any2vec.pyx":44 + * h = h ^ (b) + * h = h * 16777619 + * return h # <<<<<<<<<<<<<< * - * cdef _byte_to_int_py3(b): - * return b # <<<<<<<<<<<<<< * - * cdef _byte_to_int_py2(b): */ __Pyx_XDECREF(__pyx_r); - __Pyx_INCREF(__pyx_v_b); - __pyx_r = __pyx_v_b; + __pyx_t_6 = __Pyx_PyInt_From_uint32_t(__pyx_v_h); if (unlikely(!__pyx_t_6)) __PYX_ERR(0, 44, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_6); + __pyx_r = __pyx_t_6; + __pyx_t_6 = 0; goto __pyx_L0; - /* "gensim/models/_utils_any2vec.pyx":15 - * + /* "gensim/models/_utils_any2vec.pyx":22 * - * cdef _byte_to_int_py3(b): # <<<<<<<<<<<<<< - * return b * + * cpdef ft_hash_bytes(bytes bytez): # <<<<<<<<<<<<<< + * """Calculate hash based on `bytez`. + * Reproduce `hash method from Facebook fastText implementation */ /* function exit code */ + __pyx_L1_error:; + __Pyx_XDECREF(__pyx_t_1); + __Pyx_XDECREF(__pyx_t_6); + __Pyx_AddTraceback("gensim.models._utils_any2vec.ft_hash_bytes", __pyx_clineno, __pyx_lineno, __pyx_filename); + __pyx_r = 0; __pyx_L0:; __Pyx_XGIVEREF(__pyx_r); __Pyx_RefNannyFinishContext(); return __pyx_r; } -/* "gensim/models/_utils_any2vec.pyx":18 - * return b - * - * cdef _byte_to_int_py2(b): # <<<<<<<<<<<<<< - * return ord(b) - * - */ +/* Python wrapper */ +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash_bytes(PyObject *__pyx_self, PyObject *__pyx_v_bytez); /*proto*/ +static char __pyx_doc_6gensim_6models_14_utils_any2vec_ft_hash_bytes[] = "ft_hash_bytes(bytes bytez)\nCalculate hash based on `bytez`.\n Reproduce `hash method from Facebook fastText implementation\n `_.\n\n Parameters\n ----------\n bytez : bytes\n The string whose hash needs to be calculated, encoded as UTF-8.\n\n Returns\n -------\n unsigned int\n The hash of the string.\n\n "; +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash_bytes(PyObject *__pyx_self, PyObject *__pyx_v_bytez) { + PyObject 
*__pyx_r = 0; + __Pyx_RefNannyDeclarations + __Pyx_RefNannySetupContext("ft_hash_bytes (wrapper)", 0); + if (unlikely(!__Pyx_ArgTypeTest(((PyObject *)__pyx_v_bytez), (&PyBytes_Type), 1, "bytez", 1))) __PYX_ERR(0, 22, __pyx_L1_error) + __pyx_r = __pyx_pf_6gensim_6models_14_utils_any2vec_ft_hash_bytes(__pyx_self, ((PyObject*)__pyx_v_bytez)); + + /* function exit code */ + goto __pyx_L0; + __pyx_L1_error:; + __pyx_r = NULL; + __pyx_L0:; + __Pyx_RefNannyFinishContext(); + return __pyx_r; +} -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec__byte_to_int_py2(PyObject *__pyx_v_b) { +static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_ft_hash_bytes(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_bytez) { PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations - long __pyx_t_1; - PyObject *__pyx_t_2 = NULL; - __Pyx_RefNannySetupContext("_byte_to_int_py2", 0); - - /* "gensim/models/_utils_any2vec.pyx":19 - * - * cdef _byte_to_int_py2(b): - * return ord(b) # <<<<<<<<<<<<<< - * - * _byte_to_int = _byte_to_int_py2 if PY2 else _byte_to_int_py3 - */ + PyObject *__pyx_t_1 = NULL; + __Pyx_RefNannySetupContext("ft_hash_bytes", 0); __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = __Pyx_PyObject_Ord(__pyx_v_b); if (unlikely(__pyx_t_1 == ((long)(long)(Py_UCS4)-1))) __PYX_ERR(0, 19, __pyx_L1_error) - __pyx_t_2 = __Pyx_PyInt_From_long(__pyx_t_1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 19, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_2); - __pyx_r = __pyx_t_2; - __pyx_t_2 = 0; + __pyx_t_1 = __pyx_f_6gensim_6models_14_utils_any2vec_ft_hash_bytes(__pyx_v_bytez, 0); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 22, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_r = __pyx_t_1; + __pyx_t_1 = 0; goto __pyx_L0; - /* "gensim/models/_utils_any2vec.pyx":18 - * return b - * - * cdef _byte_to_int_py2(b): # <<<<<<<<<<<<<< - * return ord(b) - * - */ - /* function exit code */ __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_2); - __Pyx_AddTraceback("gensim.models._utils_any2vec._byte_to_int_py2", __pyx_clineno, 
__pyx_lineno, __pyx_filename); - __pyx_r = 0; + __Pyx_XDECREF(__pyx_t_1); + __Pyx_AddTraceback("gensim.models._utils_any2vec.ft_hash_bytes", __pyx_clineno, __pyx_lineno, __pyx_filename); + __pyx_r = NULL; __pyx_L0:; __Pyx_XGIVEREF(__pyx_r); __Pyx_RefNannyFinishContext(); return __pyx_r; } -/* "gensim/models/_utils_any2vec.pyx":24 +/* "gensim/models/_utils_any2vec.pyx":47 * * - * cpdef ft_hash(unicode string): # <<<<<<<<<<<<<< + * cpdef ft_hash_broken(unicode string): # <<<<<<<<<<<<<< * """Calculate hash based on `string`. - * Reproduce `hash method from Facebook fastText implementation + * */ -static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash(PyObject *__pyx_self, PyObject *__pyx_v_string); /*proto*/ -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash(PyObject *__pyx_v_string, CYTHON_UNUSED int __pyx_skip_dispatch) { +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_3ft_hash_broken(PyObject *__pyx_self, PyObject *__pyx_v_string); /*proto*/ +static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash_broken(PyObject *__pyx_v_string, CYTHON_UNUSED int __pyx_skip_dispatch) { unsigned int __pyx_v_h; PyObject *__pyx_v_c = NULL; PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations PyObject *__pyx_t_1 = NULL; - PyObject *__pyx_t_2 = NULL; - PyObject *(*__pyx_t_3)(PyObject *); - PyObject *__pyx_t_4 = NULL; - PyObject *__pyx_t_5 = NULL; - PyObject *__pyx_t_6 = NULL; - PyObject *__pyx_t_7 = NULL; + Py_ssize_t __pyx_t_2; + Py_ssize_t __pyx_t_3; + void *__pyx_t_4; + int __pyx_t_5; + int __pyx_t_6; + Py_ssize_t __pyx_t_7; PyObject *__pyx_t_8 = NULL; - PyObject *__pyx_t_9 = NULL; - PyObject *__pyx_t_10 = NULL; - PyObject *__pyx_t_11 = NULL; - PyObject *__pyx_t_12 = NULL; - unsigned int __pyx_t_13; - __Pyx_RefNannySetupContext("ft_hash", 0); + long __pyx_t_9; + __Pyx_RefNannySetupContext("ft_hash_broken", 0); - /* "gensim/models/_utils_any2vec.pyx":40 + /* "gensim/models/_utils_any2vec.pyx":64 * * """ * cdef unsigned int h = 
2166136261 # <<<<<<<<<<<<<< - * for c in string.encode("utf-8"): - * h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) + * for c in string: + * h ^= ord(c) */ __pyx_v_h = 0x811C9DC5; - /* "gensim/models/_utils_any2vec.pyx":41 + /* "gensim/models/_utils_any2vec.pyx":65 * """ * cdef unsigned int h = 2166136261 - * for c in string.encode("utf-8"): # <<<<<<<<<<<<<< - * h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) - * h = np.uint32(h * np.uint32(16777619)) + * for c in string: # <<<<<<<<<<<<<< + * h ^= ord(c) + * h *= 16777619 */ if (unlikely(__pyx_v_string == Py_None)) { - PyErr_Format(PyExc_AttributeError, "'NoneType' object has no attribute '%.30s'", "encode"); - __PYX_ERR(0, 41, __pyx_L1_error) - } - __pyx_t_1 = PyUnicode_AsUTF8String(__pyx_v_string); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 41, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = PyObject_GetIter(__pyx_t_1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 41, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_2); - __pyx_t_3 = Py_TYPE(__pyx_t_2)->tp_iternext; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 41, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - for (;;) { - { - __pyx_t_1 = __pyx_t_3(__pyx_t_2); - if (unlikely(!__pyx_t_1)) { - PyObject* exc_type = PyErr_Occurred(); - if (exc_type) { - if (likely(__Pyx_PyErr_GivenExceptionMatches(exc_type, PyExc_StopIteration))) PyErr_Clear(); - else __PYX_ERR(0, 41, __pyx_L1_error) - } - break; - } - __Pyx_GOTREF(__pyx_t_1); - } - __Pyx_XDECREF_SET(__pyx_v_c, __pyx_t_1); - __pyx_t_1 = 0; - - /* "gensim/models/_utils_any2vec.pyx":42 - * cdef unsigned int h = 2166136261 - * for c in string.encode("utf-8"): - * h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) # <<<<<<<<<<<<<< - * h = np.uint32(h * np.uint32(16777619)) - * return h - */ - __Pyx_GetModuleGlobalName(__pyx_t_4, __pyx_n_s_np); if (unlikely(!__pyx_t_4)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_4); - __pyx_t_5 = __Pyx_PyObject_GetAttrStr(__pyx_t_4, __pyx_n_s_uint32); if 
(unlikely(!__pyx_t_5)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_5); - __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_4 = __Pyx_PyInt_From_unsigned_int(__pyx_v_h); if (unlikely(!__pyx_t_4)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_4); - __Pyx_GetModuleGlobalName(__pyx_t_7, __pyx_n_s_np); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_7); - __pyx_t_8 = __Pyx_PyObject_GetAttrStr(__pyx_t_7, __pyx_n_s_uint32); if (unlikely(!__pyx_t_8)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_8); - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - __Pyx_GetModuleGlobalName(__pyx_t_9, __pyx_n_s_np); if (unlikely(!__pyx_t_9)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_9); - __pyx_t_10 = __Pyx_PyObject_GetAttrStr(__pyx_t_9, __pyx_n_s_int8); if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_10); - __Pyx_DECREF(__pyx_t_9); __pyx_t_9 = 0; - __Pyx_GetModuleGlobalName(__pyx_t_11, __pyx_n_s_byte_to_int); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_11); - __pyx_t_12 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_11))) { - __pyx_t_12 = PyMethod_GET_SELF(__pyx_t_11); - if (likely(__pyx_t_12)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_11); - __Pyx_INCREF(__pyx_t_12); - __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_11, function); - } - } - __pyx_t_9 = (__pyx_t_12) ? 
__Pyx_PyObject_Call2Args(__pyx_t_11, __pyx_t_12, __pyx_v_c) : __Pyx_PyObject_CallOneArg(__pyx_t_11, __pyx_v_c); - __Pyx_XDECREF(__pyx_t_12); __pyx_t_12 = 0; - if (unlikely(!__pyx_t_9)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_9); - __Pyx_DECREF(__pyx_t_11); __pyx_t_11 = 0; - __pyx_t_11 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_10))) { - __pyx_t_11 = PyMethod_GET_SELF(__pyx_t_10); - if (likely(__pyx_t_11)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_10); - __Pyx_INCREF(__pyx_t_11); - __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_10, function); - } - } - __pyx_t_7 = (__pyx_t_11) ? __Pyx_PyObject_Call2Args(__pyx_t_10, __pyx_t_11, __pyx_t_9) : __Pyx_PyObject_CallOneArg(__pyx_t_10, __pyx_t_9); - __Pyx_XDECREF(__pyx_t_11); __pyx_t_11 = 0; - __Pyx_DECREF(__pyx_t_9); __pyx_t_9 = 0; - if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_7); - __Pyx_DECREF(__pyx_t_10); __pyx_t_10 = 0; - __pyx_t_10 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_8))) { - __pyx_t_10 = PyMethod_GET_SELF(__pyx_t_8); - if (likely(__pyx_t_10)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_8); - __Pyx_INCREF(__pyx_t_10); - __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_8, function); - } - } - __pyx_t_6 = (__pyx_t_10) ? 
__Pyx_PyObject_Call2Args(__pyx_t_8, __pyx_t_10, __pyx_t_7) : __Pyx_PyObject_CallOneArg(__pyx_t_8, __pyx_t_7); - __Pyx_XDECREF(__pyx_t_10); __pyx_t_10 = 0; - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - if (unlikely(!__pyx_t_6)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_6); - __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __pyx_t_8 = PyNumber_Xor(__pyx_t_4, __pyx_t_6); if (unlikely(!__pyx_t_8)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_8); - __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __Pyx_DECREF(__pyx_t_6); __pyx_t_6 = 0; - __pyx_t_6 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_5))) { - __pyx_t_6 = PyMethod_GET_SELF(__pyx_t_5); - if (likely(__pyx_t_6)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_5); - __Pyx_INCREF(__pyx_t_6); - __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_5, function); - } - } - __pyx_t_1 = (__pyx_t_6) ? __Pyx_PyObject_Call2Args(__pyx_t_5, __pyx_t_6, __pyx_t_8) : __Pyx_PyObject_CallOneArg(__pyx_t_5, __pyx_t_8); - __Pyx_XDECREF(__pyx_t_6); __pyx_t_6 = 0; - __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_5); __pyx_t_5 = 0; - __pyx_t_13 = __Pyx_PyInt_As_unsigned_int(__pyx_t_1); if (unlikely((__pyx_t_13 == (unsigned int)-1) && PyErr_Occurred())) __PYX_ERR(0, 42, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_h = __pyx_t_13; - - /* "gensim/models/_utils_any2vec.pyx":43 - * for c in string.encode("utf-8"): - * h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) - * h = np.uint32(h * np.uint32(16777619)) # <<<<<<<<<<<<<< - * return h - * - */ - __Pyx_GetModuleGlobalName(__pyx_t_5, __pyx_n_s_np); if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_5); - __pyx_t_8 = __Pyx_PyObject_GetAttrStr(__pyx_t_5, __pyx_n_s_uint32); if (unlikely(!__pyx_t_8)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_8); - __Pyx_DECREF(__pyx_t_5); __pyx_t_5 
= 0; - __pyx_t_5 = __Pyx_PyInt_From_unsigned_int(__pyx_v_h); if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_5); - __Pyx_GetModuleGlobalName(__pyx_t_4, __pyx_n_s_np); if (unlikely(!__pyx_t_4)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_4); - __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_4, __pyx_n_s_uint32); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_7); - __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_4 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_7))) { - __pyx_t_4 = PyMethod_GET_SELF(__pyx_t_7); - if (likely(__pyx_t_4)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_7); - __Pyx_INCREF(__pyx_t_4); - __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_7, function); - } - } - __pyx_t_6 = (__pyx_t_4) ? __Pyx_PyObject_Call2Args(__pyx_t_7, __pyx_t_4, __pyx_int_16777619) : __Pyx_PyObject_CallOneArg(__pyx_t_7, __pyx_int_16777619); - __Pyx_XDECREF(__pyx_t_4); __pyx_t_4 = 0; - if (unlikely(!__pyx_t_6)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_6); - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - __pyx_t_7 = PyNumber_Multiply(__pyx_t_5, __pyx_t_6); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_7); - __Pyx_DECREF(__pyx_t_5); __pyx_t_5 = 0; - __Pyx_DECREF(__pyx_t_6); __pyx_t_6 = 0; - __pyx_t_6 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_8))) { - __pyx_t_6 = PyMethod_GET_SELF(__pyx_t_8); - if (likely(__pyx_t_6)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_8); - __Pyx_INCREF(__pyx_t_6); - __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_8, function); - } - } - __pyx_t_1 = (__pyx_t_6) ? 
__Pyx_PyObject_Call2Args(__pyx_t_8, __pyx_t_6, __pyx_t_7) : __Pyx_PyObject_CallOneArg(__pyx_t_8, __pyx_t_7); - __Pyx_XDECREF(__pyx_t_6); __pyx_t_6 = 0; - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __pyx_t_13 = __Pyx_PyInt_As_unsigned_int(__pyx_t_1); if (unlikely((__pyx_t_13 == (unsigned int)-1) && PyErr_Occurred())) __PYX_ERR(0, 43, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_h = __pyx_t_13; - - /* "gensim/models/_utils_any2vec.pyx":41 - * """ - * cdef unsigned int h = 2166136261 - * for c in string.encode("utf-8"): # <<<<<<<<<<<<<< - * h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) - * h = np.uint32(h * np.uint32(16777619)) - */ - } - __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - - /* "gensim/models/_utils_any2vec.pyx":44 - * h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) - * h = np.uint32(h * np.uint32(16777619)) - * return h # <<<<<<<<<<<<<< - * - * - */ - __Pyx_XDECREF(__pyx_r); - __pyx_t_2 = __Pyx_PyInt_From_unsigned_int(__pyx_v_h); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 44, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_2); - __pyx_r = __pyx_t_2; - __pyx_t_2 = 0; - goto __pyx_L0; - - /* "gensim/models/_utils_any2vec.pyx":24 - * - * - * cpdef ft_hash(unicode string): # <<<<<<<<<<<<<< - * """Calculate hash based on `string`. 
- * Reproduce `hash method from Facebook fastText implementation - */ - - /* function exit code */ - __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_1); - __Pyx_XDECREF(__pyx_t_2); - __Pyx_XDECREF(__pyx_t_4); - __Pyx_XDECREF(__pyx_t_5); - __Pyx_XDECREF(__pyx_t_6); - __Pyx_XDECREF(__pyx_t_7); - __Pyx_XDECREF(__pyx_t_8); - __Pyx_XDECREF(__pyx_t_9); - __Pyx_XDECREF(__pyx_t_10); - __Pyx_XDECREF(__pyx_t_11); - __Pyx_XDECREF(__pyx_t_12); - __Pyx_AddTraceback("gensim.models._utils_any2vec.ft_hash", __pyx_clineno, __pyx_lineno, __pyx_filename); - __pyx_r = 0; - __pyx_L0:; - __Pyx_XDECREF(__pyx_v_c); - __Pyx_XGIVEREF(__pyx_r); - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -/* Python wrapper */ -static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash(PyObject *__pyx_self, PyObject *__pyx_v_string); /*proto*/ -static char __pyx_doc_6gensim_6models_14_utils_any2vec_ft_hash[] = "ft_hash(unicode string)\nCalculate hash based on `string`.\n Reproduce `hash method from Facebook fastText implementation\n `_.\n\n Parameters\n ----------\n string : unicode\n The string whose hash needs to be calculated.\n\n Returns\n -------\n unsigned int\n The hash of the string.\n\n "; -static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash(PyObject *__pyx_self, PyObject *__pyx_v_string) { - PyObject *__pyx_r = 0; - __Pyx_RefNannyDeclarations - __Pyx_RefNannySetupContext("ft_hash (wrapper)", 0); - if (unlikely(!__Pyx_ArgTypeTest(((PyObject *)__pyx_v_string), (&PyUnicode_Type), 1, "string", 1))) __PYX_ERR(0, 24, __pyx_L1_error) - __pyx_r = __pyx_pf_6gensim_6models_14_utils_any2vec_ft_hash(__pyx_self, ((PyObject*)__pyx_v_string)); - - /* function exit code */ - goto __pyx_L0; - __pyx_L1_error:; - __pyx_r = NULL; - __pyx_L0:; - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_ft_hash(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_string) { - PyObject *__pyx_r = NULL; - __Pyx_RefNannyDeclarations - 
PyObject *__pyx_t_1 = NULL; - __Pyx_RefNannySetupContext("ft_hash", 0); - __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = __pyx_f_6gensim_6models_14_utils_any2vec_ft_hash(__pyx_v_string, 0); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 24, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_r = __pyx_t_1; - __pyx_t_1 = 0; - goto __pyx_L0; - - /* function exit code */ - __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_1); - __Pyx_AddTraceback("gensim.models._utils_any2vec.ft_hash", __pyx_clineno, __pyx_lineno, __pyx_filename); - __pyx_r = NULL; - __pyx_L0:; - __Pyx_XGIVEREF(__pyx_r); - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -/* "gensim/models/_utils_any2vec.pyx":47 - * - * - * cpdef ft_hash_broken(unicode string): # <<<<<<<<<<<<<< - * """Calculate hash based on `string`. - * - */ - -static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_3ft_hash_broken(PyObject *__pyx_self, PyObject *__pyx_v_string); /*proto*/ -static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_ft_hash_broken(PyObject *__pyx_v_string, CYTHON_UNUSED int __pyx_skip_dispatch) { - unsigned int __pyx_v_h; - PyObject *__pyx_v_c = NULL; - PyObject *__pyx_r = NULL; - __Pyx_RefNannyDeclarations - PyObject *__pyx_t_1 = NULL; - Py_ssize_t __pyx_t_2; - Py_ssize_t __pyx_t_3; - void *__pyx_t_4; - int __pyx_t_5; - int __pyx_t_6; - Py_ssize_t __pyx_t_7; - PyObject *__pyx_t_8 = NULL; - long __pyx_t_9; - __Pyx_RefNannySetupContext("ft_hash_broken", 0); - - /* "gensim/models/_utils_any2vec.pyx":64 - * - * """ - * cdef unsigned int h = 2166136261 # <<<<<<<<<<<<<< - * for c in string: - * h ^= ord(c) - */ - __pyx_v_h = 0x811C9DC5; - - /* "gensim/models/_utils_any2vec.pyx":65 - * """ - * cdef unsigned int h = 2166136261 - * for c in string: # <<<<<<<<<<<<<< - * h ^= ord(c) - * h *= 16777619 - */ - if (unlikely(__pyx_v_string == Py_None)) { - PyErr_SetString(PyExc_TypeError, "'NoneType' is not iterable"); - __PYX_ERR(0, 65, __pyx_L1_error) + PyErr_SetString(PyExc_TypeError, "'NoneType' is not iterable"); + __PYX_ERR(0, 
65, __pyx_L1_error) } __Pyx_INCREF(__pyx_v_string); __pyx_t_1 = __pyx_v_string; @@ -2610,6 +2240,7 @@ static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_compute_ngrams(PyObjec * for i in range(0, len(extended_word) - ngram_length + 1): * ngrams.append(extended_word[i:i + ngram_length]) # <<<<<<<<<<<<<< * return ngrams + * */ __Pyx_INCREF(__pyx_v_i); __pyx_t_1 = __pyx_v_i; @@ -2660,6 +2291,8 @@ static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_compute_ngrams(PyObjec * for i in range(0, len(extended_word) - ngram_length + 1): * ngrams.append(extended_word[i:i + ngram_length]) * return ngrams # <<<<<<<<<<<<<< + * + * # */ __Pyx_XDECREF(__pyx_r); __Pyx_INCREF(__pyx_v_ngrams); @@ -2787,97 +2420,520 @@ static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_4compute_ngrams(CYTHO return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 - * # experimental exception made for __getbuffer__ and __releasebuffer__ - * # -- the details of this may change. - * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< - * # This implementation of getbuffer is geared towards Cython - * # requirements, and does not yet fulfill the PEP. +/* "gensim/models/_utils_any2vec.pyx":104 + * + * + * cpdef compute_ngrams_bytes(word, unsigned int min_n, unsigned int max_n): # <<<<<<<<<<<<<< + * """Computes ngrams for a word. 
+ * */ -/* Python wrapper */ -static CYTHON_UNUSED int __pyx_pw_5numpy_7ndarray_1__getbuffer__(PyObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags); /*proto*/ -static CYTHON_UNUSED int __pyx_pw_5numpy_7ndarray_1__getbuffer__(PyObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags) { - int __pyx_r; +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_7compute_ngrams_bytes(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ +static PyObject *__pyx_f_6gensim_6models_14_utils_any2vec_compute_ngrams_bytes(PyObject *__pyx_v_word, unsigned int __pyx_v_min_n, unsigned int __pyx_v_max_n, CYTHON_UNUSED int __pyx_skip_dispatch) { + PyObject *__pyx_v_utf8_word = 0; + unsigned char const *__pyx_v_bytez; + size_t __pyx_v_num_bytes; + size_t __pyx_v_j; + size_t __pyx_v_i; + size_t __pyx_v_n; + PyObject *__pyx_v_ngrams = NULL; + PyObject *__pyx_v_ngram = NULL; + PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations - __Pyx_RefNannySetupContext("__getbuffer__ (wrapper)", 0); - __pyx_r = __pyx_pf_5numpy_7ndarray___getbuffer__(((PyArrayObject *)__pyx_v_self), ((Py_buffer *)__pyx_v_info), ((int)__pyx_v_flags)); + PyObject *__pyx_t_1 = NULL; + PyObject *__pyx_t_2 = NULL; + PyObject *__pyx_t_3 = NULL; + unsigned char const *__pyx_t_4; + Py_ssize_t __pyx_t_5; + size_t __pyx_t_6; + size_t __pyx_t_7; + size_t __pyx_t_8; + int __pyx_t_9; + size_t __pyx_t_10; + size_t __pyx_t_11; + int __pyx_t_12; + int __pyx_t_13; + int __pyx_t_14; + __Pyx_RefNannySetupContext("compute_ngrams_bytes", 0); - /* function exit code */ - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} + /* "gensim/models/_utils_any2vec.pyx":128 + * + * """ + * cdef bytes utf8_word = ('<%s>' % word).encode("utf-8") # <<<<<<<<<<<<<< + * cdef const unsigned char *bytez = utf8_word + * cdef size_t num_bytes = len(utf8_word) + */ + __pyx_t_2 = __Pyx_PyString_FormatSafe(__pyx_kp_s_s, __pyx_v_word); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 128, __pyx_L1_error) + 
__Pyx_GOTREF(__pyx_t_2); + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_2, __pyx_n_s_encode); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 128, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_3); + __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; + __pyx_t_2 = NULL; + if (CYTHON_UNPACK_METHODS && likely(PyMethod_Check(__pyx_t_3))) { + __pyx_t_2 = PyMethod_GET_SELF(__pyx_t_3); + if (likely(__pyx_t_2)) { + PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_3); + __Pyx_INCREF(__pyx_t_2); + __Pyx_INCREF(function); + __Pyx_DECREF_SET(__pyx_t_3, function); + } + } + __pyx_t_1 = (__pyx_t_2) ? __Pyx_PyObject_Call2Args(__pyx_t_3, __pyx_t_2, __pyx_kp_s_utf_8) : __Pyx_PyObject_CallOneArg(__pyx_t_3, __pyx_kp_s_utf_8); + __Pyx_XDECREF(__pyx_t_2); __pyx_t_2 = 0; + if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 128, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; + if (!(likely(PyBytes_CheckExact(__pyx_t_1))||((__pyx_t_1) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "bytes", Py_TYPE(__pyx_t_1)->tp_name), 0))) __PYX_ERR(0, 128, __pyx_L1_error) + __pyx_v_utf8_word = ((PyObject*)__pyx_t_1); + __pyx_t_1 = 0; -static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags) { - int __pyx_v_i; - int __pyx_v_ndim; - int __pyx_v_endian_detector; - int __pyx_v_little_endian; - int __pyx_v_t; - char *__pyx_v_f; - PyArray_Descr *__pyx_v_descr = 0; - int __pyx_v_offset; - int __pyx_r; - __Pyx_RefNannyDeclarations - int __pyx_t_1; - int __pyx_t_2; - PyObject *__pyx_t_3 = NULL; - int __pyx_t_4; - int __pyx_t_5; - int __pyx_t_6; - PyArray_Descr *__pyx_t_7; - PyObject *__pyx_t_8 = NULL; - char *__pyx_t_9; - if (__pyx_v_info == NULL) { - PyErr_SetString(PyExc_BufferError, "PyObject_GetBuffer: view==NULL argument is obsolete"); - return -1; + /* "gensim/models/_utils_any2vec.pyx":129 + * """ + * cdef bytes utf8_word = ('<%s>' % word).encode("utf-8") + * cdef const unsigned char *bytez = utf8_word # 
<<<<<<<<<<<<<< + * cdef size_t num_bytes = len(utf8_word) + * cdef size_t j, i, n + */ + if (unlikely(__pyx_v_utf8_word == Py_None)) { + PyErr_SetString(PyExc_TypeError, "expected bytes, NoneType found"); + __PYX_ERR(0, 129, __pyx_L1_error) } - __Pyx_RefNannySetupContext("__getbuffer__", 0); - __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); - __Pyx_GIVEREF(__pyx_v_info->obj); + __pyx_t_4 = __Pyx_PyBytes_AsUString(__pyx_v_utf8_word); if (unlikely((!__pyx_t_4) && PyErr_Occurred())) __PYX_ERR(0, 129, __pyx_L1_error) + __pyx_v_bytez = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "gensim/models/_utils_any2vec.pyx":130 + * cdef bytes utf8_word = ('<%s>' % word).encode("utf-8") + * cdef const unsigned char *bytez = utf8_word + * cdef size_t num_bytes = len(utf8_word) # <<<<<<<<<<<<<< + * cdef size_t j, i, n * - * cdef int i, ndim - * cdef int endian_detector = 1 # <<<<<<<<<<<<<< - * cdef bint little_endian = ((&endian_detector)[0] != 0) + */ + if (unlikely(__pyx_v_utf8_word == Py_None)) { + PyErr_SetString(PyExc_TypeError, "object of type 'NoneType' has no len()"); + __PYX_ERR(0, 130, __pyx_L1_error) + } + __pyx_t_5 = PyBytes_GET_SIZE(__pyx_v_utf8_word); if (unlikely(__pyx_t_5 == ((Py_ssize_t)-1))) __PYX_ERR(0, 130, __pyx_L1_error) + __pyx_v_num_bytes = __pyx_t_5; + + /* "gensim/models/_utils_any2vec.pyx":133 + * cdef size_t j, i, n * + * ngrams = [] # <<<<<<<<<<<<<< + * for i in range(num_bytes): + * if bytez[i] & _MB_MASK == _MB_START: */ - __pyx_v_endian_detector = 1; + __pyx_t_1 = PyList_New(0); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 133, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_v_ngrams = ((PyObject*)__pyx_t_1); + __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 - * cdef int i, ndim - * cdef int endian_detector = 1 - * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< + /* 
"gensim/models/_utils_any2vec.pyx":134 * - * ndim = PyArray_NDIM(self) + * ngrams = [] + * for i in range(num_bytes): # <<<<<<<<<<<<<< + * if bytez[i] & _MB_MASK == _MB_START: + * continue */ - __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); + __pyx_t_6 = __pyx_v_num_bytes; + __pyx_t_7 = __pyx_t_6; + for (__pyx_t_8 = 0; __pyx_t_8 < __pyx_t_7; __pyx_t_8+=1) { + __pyx_v_i = __pyx_t_8; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 - * cdef bint little_endian = ((&endian_detector)[0] != 0) + /* "gensim/models/_utils_any2vec.pyx":135 + * ngrams = [] + * for i in range(num_bytes): + * if bytez[i] & _MB_MASK == _MB_START: # <<<<<<<<<<<<<< + * continue * - * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< + */ + __pyx_t_9 = ((((__pyx_v_bytez[__pyx_v_i]) & __pyx_v_6gensim_6models_14_utils_any2vec__MB_MASK) == __pyx_v_6gensim_6models_14_utils_any2vec__MB_START) != 0); + if (__pyx_t_9) { + + /* "gensim/models/_utils_any2vec.pyx":136 + * for i in range(num_bytes): + * if bytez[i] & _MB_MASK == _MB_START: + * continue # <<<<<<<<<<<<<< * - * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) + * j, n = i, 1 */ - __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); + goto __pyx_L3_continue; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 - * ndim = PyArray_NDIM(self) + /* "gensim/models/_utils_any2vec.pyx":135 + * ngrams = [] + * for i in range(num_bytes): + * if bytez[i] & _MB_MASK == _MB_START: # <<<<<<<<<<<<<< + * continue * - * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): - * raise ValueError(u"ndarray is not C contiguous") */ - __pyx_t_2 = (((__pyx_v_flags & PyBUF_C_CONTIGUOUS) == PyBUF_C_CONTIGUOUS) != 0); - if (__pyx_t_2) { - } else { - __pyx_t_1 = __pyx_t_2; - goto __pyx_L4_bool_binop_done; - } + } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "gensim/models/_utils_any2vec.pyx":138 + * continue + * + * j, n = i, 1 # <<<<<<<<<<<<<< + * while j < num_bytes and n <= max_n: + * j += 1 + */ + __pyx_t_10 = __pyx_v_i; + __pyx_t_11 = 1; + __pyx_v_j = __pyx_t_10; + __pyx_v_n = __pyx_t_11; + + /* "gensim/models/_utils_any2vec.pyx":139 + * + * j, n = i, 1 + * while j < num_bytes and n <= max_n: # <<<<<<<<<<<<<< + * j += 1 + * while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: + */ + while (1) { + __pyx_t_12 = ((__pyx_v_j < __pyx_v_num_bytes) != 0); + if (__pyx_t_12) { + } else { + __pyx_t_9 = __pyx_t_12; + goto __pyx_L8_bool_binop_done; + } + __pyx_t_12 = ((__pyx_v_n <= __pyx_v_max_n) != 0); + __pyx_t_9 = __pyx_t_12; + __pyx_L8_bool_binop_done:; + if (!__pyx_t_9) break; + + /* "gensim/models/_utils_any2vec.pyx":140 + * j, n = i, 1 + * while j < num_bytes and n <= max_n: + * j += 1 # <<<<<<<<<<<<<< + * while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: + * j += 1 + */ + __pyx_v_j = (__pyx_v_j + 1); + + /* "gensim/models/_utils_any2vec.pyx":141 + * while j < num_bytes and n <= max_n: + * j += 1 + * while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: # <<<<<<<<<<<<<< + * j += 1 + * if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): + */ + while (1) { + __pyx_t_12 = ((__pyx_v_j < __pyx_v_num_bytes) != 0); + if (__pyx_t_12) { + } else { + __pyx_t_9 = __pyx_t_12; + goto __pyx_L12_bool_binop_done; + } + __pyx_t_12 = ((((__pyx_v_bytez[__pyx_v_j]) & __pyx_v_6gensim_6models_14_utils_any2vec__MB_MASK) == __pyx_v_6gensim_6models_14_utils_any2vec__MB_START) != 0); + __pyx_t_9 = __pyx_t_12; + __pyx_L12_bool_binop_done:; + if (!__pyx_t_9) break; + + /* "gensim/models/_utils_any2vec.pyx":142 + * j += 1 + * while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: + * j += 1 # <<<<<<<<<<<<<< + * if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): + * ngram = bytes(bytez[i:j]) 
+ */ + __pyx_v_j = (__pyx_v_j + 1); + } + + /* "gensim/models/_utils_any2vec.pyx":143 + * while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: + * j += 1 + * if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): # <<<<<<<<<<<<<< + * ngram = bytes(bytez[i:j]) + * ngrams.append(ngram) + */ + __pyx_t_12 = ((__pyx_v_n >= __pyx_v_min_n) != 0); + if (__pyx_t_12) { + } else { + __pyx_t_9 = __pyx_t_12; + goto __pyx_L15_bool_binop_done; + } + __pyx_t_13 = ((__pyx_v_n == 1) != 0); + if (__pyx_t_13) { + } else { + __pyx_t_12 = __pyx_t_13; + goto __pyx_L17_bool_binop_done; + } + __pyx_t_13 = ((__pyx_v_i == 0) != 0); + if (!__pyx_t_13) { + } else { + __pyx_t_12 = __pyx_t_13; + goto __pyx_L17_bool_binop_done; + } + __pyx_t_13 = ((__pyx_v_j == __pyx_v_num_bytes) != 0); + __pyx_t_12 = __pyx_t_13; + __pyx_L17_bool_binop_done:; + __pyx_t_13 = ((!__pyx_t_12) != 0); + __pyx_t_9 = __pyx_t_13; + __pyx_L15_bool_binop_done:; + if (__pyx_t_9) { + + /* "gensim/models/_utils_any2vec.pyx":144 + * j += 1 + * if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): + * ngram = bytes(bytez[i:j]) # <<<<<<<<<<<<<< + * ngrams.append(ngram) + * n += 1 + */ + __pyx_t_1 = __Pyx_PyBytes_FromStringAndSize(((const char*)__pyx_v_bytez) + __pyx_v_i, __pyx_v_j - __pyx_v_i); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 144, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_t_3 = __Pyx_PyObject_CallOneArg(((PyObject *)(&PyBytes_Type)), __pyx_t_1); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 144, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_3); + __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; + __Pyx_XDECREF_SET(__pyx_v_ngram, ((PyObject*)__pyx_t_3)); + __pyx_t_3 = 0; + + /* "gensim/models/_utils_any2vec.pyx":145 + * if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): + * ngram = bytes(bytez[i:j]) + * ngrams.append(ngram) # <<<<<<<<<<<<<< + * n += 1 + * return ngrams + */ + __pyx_t_14 = __Pyx_PyList_Append(__pyx_v_ngrams, __pyx_v_ngram); if (unlikely(__pyx_t_14 == ((int)-1))) __PYX_ERR(0, 145, 
__pyx_L1_error) + + /* "gensim/models/_utils_any2vec.pyx":143 + * while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: + * j += 1 + * if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): # <<<<<<<<<<<<<< + * ngram = bytes(bytez[i:j]) + * ngrams.append(ngram) + */ + } + + /* "gensim/models/_utils_any2vec.pyx":146 + * ngram = bytes(bytez[i:j]) + * ngrams.append(ngram) + * n += 1 # <<<<<<<<<<<<<< + * return ngrams + */ + __pyx_v_n = (__pyx_v_n + 1); + } + __pyx_L3_continue:; + } + + /* "gensim/models/_utils_any2vec.pyx":147 + * ngrams.append(ngram) + * n += 1 + * return ngrams # <<<<<<<<<<<<<< + */ + __Pyx_XDECREF(__pyx_r); + __Pyx_INCREF(__pyx_v_ngrams); + __pyx_r = __pyx_v_ngrams; + goto __pyx_L0; + + /* "gensim/models/_utils_any2vec.pyx":104 + * + * + * cpdef compute_ngrams_bytes(word, unsigned int min_n, unsigned int max_n): # <<<<<<<<<<<<<< + * """Computes ngrams for a word. + * + */ + + /* function exit code */ + __pyx_L1_error:; + __Pyx_XDECREF(__pyx_t_1); + __Pyx_XDECREF(__pyx_t_2); + __Pyx_XDECREF(__pyx_t_3); + __Pyx_AddTraceback("gensim.models._utils_any2vec.compute_ngrams_bytes", __pyx_clineno, __pyx_lineno, __pyx_filename); + __pyx_r = 0; + __pyx_L0:; + __Pyx_XDECREF(__pyx_v_utf8_word); + __Pyx_XDECREF(__pyx_v_ngrams); + __Pyx_XDECREF(__pyx_v_ngram); + __Pyx_XGIVEREF(__pyx_r); + __Pyx_RefNannyFinishContext(); + return __pyx_r; +} + +/* Python wrapper */ +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_7compute_ngrams_bytes(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ +static char __pyx_doc_6gensim_6models_14_utils_any2vec_6compute_ngrams_bytes[] = "compute_ngrams_bytes(word, unsigned int min_n, unsigned int max_n)\nComputes ngrams for a word.\n\n Ported from the original FB implementation.\n\n Parameters\n ----------\n word : str\n A unicode string.\n min_n : unsigned int\n The minimum ngram length.\n max_n : unsigned int\n The maximum ngram length.\n\n Returns:\n --------\n list of str\n A list 
of ngrams, where each ngram is a list of **bytes**.\n\n See Also\n --------\n `Original implementation `__\n\n "; +static PyObject *__pyx_pw_6gensim_6models_14_utils_any2vec_7compute_ngrams_bytes(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { + PyObject *__pyx_v_word = 0; + unsigned int __pyx_v_min_n; + unsigned int __pyx_v_max_n; + PyObject *__pyx_r = 0; + __Pyx_RefNannyDeclarations + __Pyx_RefNannySetupContext("compute_ngrams_bytes (wrapper)", 0); + { + static PyObject **__pyx_pyargnames[] = {&__pyx_n_s_word,&__pyx_n_s_min_n,&__pyx_n_s_max_n,0}; + PyObject* values[3] = {0,0,0}; + if (unlikely(__pyx_kwds)) { + Py_ssize_t kw_args; + const Py_ssize_t pos_args = PyTuple_GET_SIZE(__pyx_args); + switch (pos_args) { + case 3: values[2] = PyTuple_GET_ITEM(__pyx_args, 2); + CYTHON_FALLTHROUGH; + case 2: values[1] = PyTuple_GET_ITEM(__pyx_args, 1); + CYTHON_FALLTHROUGH; + case 1: values[0] = PyTuple_GET_ITEM(__pyx_args, 0); + CYTHON_FALLTHROUGH; + case 0: break; + default: goto __pyx_L5_argtuple_error; + } + kw_args = PyDict_Size(__pyx_kwds); + switch (pos_args) { + case 0: + if (likely((values[0] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_word)) != 0)) kw_args--; + else goto __pyx_L5_argtuple_error; + CYTHON_FALLTHROUGH; + case 1: + if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_min_n)) != 0)) kw_args--; + else { + __Pyx_RaiseArgtupleInvalid("compute_ngrams_bytes", 1, 3, 3, 1); __PYX_ERR(0, 104, __pyx_L3_error) + } + CYTHON_FALLTHROUGH; + case 2: + if (likely((values[2] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_max_n)) != 0)) kw_args--; + else { + __Pyx_RaiseArgtupleInvalid("compute_ngrams_bytes", 1, 3, 3, 2); __PYX_ERR(0, 104, __pyx_L3_error) + } + } + if (unlikely(kw_args > 0)) { + if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "compute_ngrams_bytes") < 0)) __PYX_ERR(0, 104, __pyx_L3_error) + } + } else if (PyTuple_GET_SIZE(__pyx_args) != 3) { + goto 
__pyx_L5_argtuple_error; + } else { + values[0] = PyTuple_GET_ITEM(__pyx_args, 0); + values[1] = PyTuple_GET_ITEM(__pyx_args, 1); + values[2] = PyTuple_GET_ITEM(__pyx_args, 2); + } + __pyx_v_word = values[0]; + __pyx_v_min_n = __Pyx_PyInt_As_unsigned_int(values[1]); if (unlikely((__pyx_v_min_n == (unsigned int)-1) && PyErr_Occurred())) __PYX_ERR(0, 104, __pyx_L3_error) + __pyx_v_max_n = __Pyx_PyInt_As_unsigned_int(values[2]); if (unlikely((__pyx_v_max_n == (unsigned int)-1) && PyErr_Occurred())) __PYX_ERR(0, 104, __pyx_L3_error) + } + goto __pyx_L4_argument_unpacking_done; + __pyx_L5_argtuple_error:; + __Pyx_RaiseArgtupleInvalid("compute_ngrams_bytes", 1, 3, 3, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 104, __pyx_L3_error) + __pyx_L3_error:; + __Pyx_AddTraceback("gensim.models._utils_any2vec.compute_ngrams_bytes", __pyx_clineno, __pyx_lineno, __pyx_filename); + __Pyx_RefNannyFinishContext(); + return NULL; + __pyx_L4_argument_unpacking_done:; + __pyx_r = __pyx_pf_6gensim_6models_14_utils_any2vec_6compute_ngrams_bytes(__pyx_self, __pyx_v_word, __pyx_v_min_n, __pyx_v_max_n); + + /* function exit code */ + __Pyx_RefNannyFinishContext(); + return __pyx_r; +} + +static PyObject *__pyx_pf_6gensim_6models_14_utils_any2vec_6compute_ngrams_bytes(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_word, unsigned int __pyx_v_min_n, unsigned int __pyx_v_max_n) { + PyObject *__pyx_r = NULL; + __Pyx_RefNannyDeclarations + PyObject *__pyx_t_1 = NULL; + __Pyx_RefNannySetupContext("compute_ngrams_bytes", 0); + __Pyx_XDECREF(__pyx_r); + __pyx_t_1 = __pyx_f_6gensim_6models_14_utils_any2vec_compute_ngrams_bytes(__pyx_v_word, __pyx_v_min_n, __pyx_v_max_n, 0); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 104, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_r = __pyx_t_1; + __pyx_t_1 = 0; + goto __pyx_L0; + + /* function exit code */ + __pyx_L1_error:; + __Pyx_XDECREF(__pyx_t_1); + __Pyx_AddTraceback("gensim.models._utils_any2vec.compute_ngrams_bytes", __pyx_clineno, __pyx_lineno, 
__pyx_filename); + __pyx_r = NULL; + __pyx_L0:; + __Pyx_XGIVEREF(__pyx_r); + __Pyx_RefNannyFinishContext(); + return __pyx_r; +} + +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + * # experimental exception made for __getbuffer__ and __releasebuffer__ + * # -- the details of this may change. + * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< + * # This implementation of getbuffer is geared towards Cython + * # requirements, and does not yet fulfill the PEP. + */ + +/* Python wrapper */ +static CYTHON_UNUSED int __pyx_pw_5numpy_7ndarray_1__getbuffer__(PyObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags); /*proto*/ +static CYTHON_UNUSED int __pyx_pw_5numpy_7ndarray_1__getbuffer__(PyObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags) { + int __pyx_r; + __Pyx_RefNannyDeclarations + __Pyx_RefNannySetupContext("__getbuffer__ (wrapper)", 0); + __pyx_r = __pyx_pf_5numpy_7ndarray___getbuffer__(((PyArrayObject *)__pyx_v_self), ((Py_buffer *)__pyx_v_info), ((int)__pyx_v_flags)); + + /* function exit code */ + __Pyx_RefNannyFinishContext(); + return __pyx_r; +} + +static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags) { + int __pyx_v_i; + int __pyx_v_ndim; + int __pyx_v_endian_detector; + int __pyx_v_little_endian; + int __pyx_v_t; + char *__pyx_v_f; + PyArray_Descr *__pyx_v_descr = 0; + int __pyx_v_offset; + int __pyx_r; + __Pyx_RefNannyDeclarations + int __pyx_t_1; + int __pyx_t_2; + PyObject *__pyx_t_3 = NULL; + int __pyx_t_4; + int __pyx_t_5; + int __pyx_t_6; + PyArray_Descr *__pyx_t_7; + PyObject *__pyx_t_8 = NULL; + char *__pyx_t_9; + if (__pyx_v_info == NULL) { + PyErr_SetString(PyExc_BufferError, "PyObject_GetBuffer: view==NULL argument is obsolete"); + return -1; + } + __Pyx_RefNannySetupContext("__getbuffer__", 0); + __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); + 
__Pyx_GIVEREF(__pyx_v_info->obj); + + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + * + * cdef int i, ndim + * cdef int endian_detector = 1 # <<<<<<<<<<<<<< + * cdef bint little_endian = ((&endian_detector)[0] != 0) + * + */ + __pyx_v_endian_detector = 1; + + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + * cdef int i, ndim + * cdef int endian_detector = 1 + * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< + * + * ndim = PyArray_NDIM(self) + */ + __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); + + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + * cdef bint little_endian = ((&endian_detector)[0] != 0) + * + * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< + * + * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) + */ + __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); + + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + * ndim = PyArray_NDIM(self) + * + * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): + * raise ValueError(u"ndarray is not C contiguous") + */ + __pyx_t_2 = (((__pyx_v_flags & PyBUF_C_CONTIGUOUS) == PyBUF_C_CONTIGUOUS) != 0); + if (__pyx_t_2) { + } else { + __pyx_t_1 = __pyx_t_2; + goto __pyx_L4_bool_binop_done; + } + + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -2888,7 +2944,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -2897,7 +2953,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -2910,7 +2966,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -2919,7 +2975,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -2933,7 +2989,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -2944,7 +3000,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -2953,7 +3009,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -2966,7 +3022,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -2975,7 +3031,7 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -2984,7 +3040,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -2993,7 +3049,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -3003,7 +3059,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -3012,7 +3068,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -3021,7 +3077,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -3033,7 +3089,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -3042,7 +3098,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -3052,7 +3108,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -3062,7 +3118,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -3072,7 +3128,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -3083,7 +3139,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -3092,7 +3148,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -3101,7 +3157,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -3110,7 +3166,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< @@ -3119,7 +3175,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_f = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL * cdef 
dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< @@ -3132,7 +3188,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -3145,7 +3201,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); __pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -3155,7 +3211,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -3165,7 +3221,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -3185,7 +3241,7 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -3202,7 +3258,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -3211,7 +3267,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -3224,7 +3280,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -3233,7 +3289,7 @@ 
static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -3246,7 +3302,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UBYTE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< @@ -3257,7 +3313,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_SHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< @@ -3268,7 +3324,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_USHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< @@ -3279,7 +3335,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_INT: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< @@ -3290,7 +3346,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UINT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< @@ -3301,7 +3357,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< @@ -3312,7 +3368,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< @@ -3323,7 +3379,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == 
NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< @@ -3334,7 +3390,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< @@ -3345,7 +3401,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_FLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< @@ -3356,7 +3412,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_DOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< @@ -3367,7 +3423,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< @@ -3378,7 +3434,7 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CFLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< @@ -3389,7 +3445,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< @@ -3400,7 +3456,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CLONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< @@ -3411,7 +3467,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_OBJECT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< @@ -3422,7 +3478,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; default: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -3443,7 +3499,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -3452,7 +3508,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -3462,7 +3518,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -3471,7 +3527,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = 
PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -3481,7 +3537,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment # <<<<<<<<<<<<<< @@ -3490,7 +3546,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -3499,7 +3555,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< @@ -3509,7 +3565,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) __pyx_v_f = __pyx_t_9; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -3519,7 +3575,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -3551,7 +3607,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -3575,7 +3631,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -3585,7 +3641,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -3594,7 +3650,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -3603,7 +3659,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -3613,7 +3669,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -3622,7 +3678,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -3631,7 +3687,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -3643,7 +3699,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -3657,7 +3713,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -3671,7 +3727,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -3690,7 +3746,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -3704,7 +3760,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -3718,7 +3774,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -3737,7 +3793,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, 
b, c): # <<<<<<<<<<<<<< @@ -3751,7 +3807,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -3765,7 +3821,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -3784,7 +3840,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -3798,7 +3854,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -3812,7 +3868,7 @@ static CYTHON_INLINE 
PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -3831,7 +3887,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -3845,7 +3901,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -3859,7 +3915,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -3878,7 +3934,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -3892,7 +3948,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -3902,7 +3958,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -3914,7 +3970,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -3923,7 +3979,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -3937,7 +3993,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -3952,7 +4008,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -3981,7 +4037,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -3990,7 +4046,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -3999,7 
+4055,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -4022,7 +4078,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -4039,7 +4095,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -4074,7 +4130,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -4091,7 +4147,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 
= ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -4104,7 +4160,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 856, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -4113,7 +4169,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -4133,7 +4189,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -4150,7 +4206,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; 
__pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -4159,7 +4215,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -4172,7 +4228,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 860, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -4181,7 +4237,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -4197,7 +4253,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; 
if (!__pyx_t_6) break; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -4206,7 +4262,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -4215,7 +4271,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -4226,7 +4282,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -4236,7 +4292,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -4246,7 +4302,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = child.type_num # <<<<<<<<<<<<<< @@ -4258,7 +4314,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -4268,7 +4324,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -4281,7 +4337,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __PYX_ERR(1, 880, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -4290,7 +4346,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< @@ -4308,7 +4364,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< @@ -4326,7 +4382,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< @@ -4344,7 +4400,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == 
NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< @@ -4362,7 +4418,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< @@ -4380,7 +4436,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< @@ -4398,7 +4454,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< @@ -4416,7 +4472,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< @@ -4434,7 +4490,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto 
__pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< @@ -4452,7 +4508,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< @@ -4470,7 +4526,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< @@ -4488,7 +4544,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< @@ -4506,7 +4562,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 + 
/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< @@ -4524,7 +4580,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< @@ -4544,7 +4600,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< @@ -4564,7 +4620,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< @@ -4584,7 +4640,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< @@ -4602,7 +4658,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -4621,7 +4677,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L15:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -4630,7 +4686,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -4640,7 +4696,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -4653,7 +4709,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L13:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -4663,7 +4719,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -4673,7 +4729,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -4698,7 +4754,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # 
<<<<<<<<<<<<<< @@ -4710,7 +4766,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 * * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! # <<<<<<<<<<<<<< @@ -4719,7 +4775,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ Py_INCREF(__pyx_v_base); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! 
* PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< @@ -4728,7 +4784,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -4740,7 +4796,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -4755,7 +4811,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< @@ -4764,7 +4820,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -4774,7 +4830,7 @@ static CYTHON_INLINE PyObject 
*__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_t_1 = ((__pyx_v_base == NULL) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 * base = PyArray_BASE(arr) * if base is NULL: * return None # <<<<<<<<<<<<<< @@ -4785,7 +4841,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -4794,7 +4850,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 * if base is NULL: * return None * return base # <<<<<<<<<<<<<< @@ -4806,7 +4862,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = ((PyObject *)__pyx_v_base); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -4821,7 +4877,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 +/* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -4842,7 +4898,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -4858,7 +4914,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< @@ -4867,7 +4923,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { */ __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -4881,7 +4937,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -4896,7 +4952,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -4912,7 +4968,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -4927,7 +4983,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. 
* cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -4950,7 +5006,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -4971,7 +5027,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -4987,7 +5043,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -4996,7 +5052,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -5010,7 +5066,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -5025,7 +5081,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -5041,7 +5097,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -5056,7 +5112,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -5079,7 +5135,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # 
<<<<<<<<<<<<<< @@ -5100,7 +5156,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -5116,7 +5172,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -5125,7 +5181,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -5139,7 +5195,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -5153,7 +5209,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -5167,7 +5223,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -5182,7 +5238,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -5205,241 +5261,24 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { return __pyx_r; } -/* "cfunc.to_py":65 - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): - * def wrap(object b): # <<<<<<<<<<<<<< - * """wrap(b)""" - * return f(b) - */ - -/* Python wrapper */ -static PyObject *__pyx_pw_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_1wrap(PyObject *__pyx_self, PyObject *__pyx_v_b); /*proto*/ -static char __pyx_doc_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_wrap[] = "wrap(b)"; -static PyMethodDef __pyx_mdef_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_1wrap = {"wrap", (PyCFunction)__pyx_pw_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_1wrap, METH_O, __pyx_doc_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_wrap}; -static PyObject 
*__pyx_pw_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_1wrap(PyObject *__pyx_self, PyObject *__pyx_v_b) { - PyObject *__pyx_r = 0; - __Pyx_RefNannyDeclarations - __Pyx_RefNannySetupContext("wrap (wrapper)", 0); - __pyx_r = __pyx_pf_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_wrap(__pyx_self, ((PyObject *)__pyx_v_b)); - - /* function exit code */ - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} +static PyMethodDef __pyx_methods[] = { + {"ft_hash_bytes", (PyCFunction)__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash_bytes, METH_O, __pyx_doc_6gensim_6models_14_utils_any2vec_ft_hash_bytes}, + {"ft_hash_broken", (PyCFunction)__pyx_pw_6gensim_6models_14_utils_any2vec_3ft_hash_broken, METH_O, __pyx_doc_6gensim_6models_14_utils_any2vec_2ft_hash_broken}, + {"compute_ngrams", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14_utils_any2vec_5compute_ngrams, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14_utils_any2vec_4compute_ngrams}, + {"compute_ngrams_bytes", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14_utils_any2vec_7compute_ngrams_bytes, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14_utils_any2vec_6compute_ngrams_bytes}, + {0, 0, 0, 0} +}; -static PyObject *__pyx_pf_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_wrap(PyObject *__pyx_self, PyObject *__pyx_v_b) { - struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *__pyx_cur_scope; - struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *__pyx_outer_scope; - PyObject *__pyx_r = NULL; - __Pyx_RefNannyDeclarations - PyObject *__pyx_t_1 = NULL; - __Pyx_RefNannySetupContext("wrap", 0); - __pyx_outer_scope = (struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *) __Pyx_CyFunction_GetClosure(__pyx_self); - __pyx_cur_scope = __pyx_outer_scope; - - /* "cfunc.to_py":67 - * def wrap(object b): - * """wrap(b)""" - * return f(b) # <<<<<<<<<<<<<< - * return wrap 
- * - */ - __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = __pyx_cur_scope->__pyx_v_f(__pyx_v_b); if (unlikely(!__pyx_t_1)) __PYX_ERR(2, 67, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_r = __pyx_t_1; - __pyx_t_1 = 0; - goto __pyx_L0; - - /* "cfunc.to_py":65 - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): - * def wrap(object b): # <<<<<<<<<<<<<< - * """wrap(b)""" - * return f(b) - */ - - /* function exit code */ - __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_1); - __Pyx_AddTraceback("cfunc.to_py.__Pyx_CFunc_object____object___to_py.wrap", __pyx_clineno, __pyx_lineno, __pyx_filename); - __pyx_r = NULL; - __pyx_L0:; - __Pyx_XGIVEREF(__pyx_r); - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -/* "cfunc.to_py":64 - * - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): # <<<<<<<<<<<<<< - * def wrap(object b): - * """wrap(b)""" - */ - -static PyObject *__Pyx_CFunc_object____object___to_py(PyObject *(*__pyx_v_f)(PyObject *)) { - struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *__pyx_cur_scope; - PyObject *__pyx_v_wrap = 0; - PyObject *__pyx_r = NULL; - __Pyx_RefNannyDeclarations - PyObject *__pyx_t_1 = NULL; - __Pyx_RefNannySetupContext("__Pyx_CFunc_object____object___to_py", 0); - __pyx_cur_scope = (struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *)__pyx_tp_new___pyx_scope_struct____Pyx_CFunc_object____object___to_py(__pyx_ptype___pyx_scope_struct____Pyx_CFunc_object____object___to_py, __pyx_empty_tuple, NULL); - if (unlikely(!__pyx_cur_scope)) { - __pyx_cur_scope = ((struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *)Py_None); - __Pyx_INCREF(Py_None); - __PYX_ERR(2, 64, __pyx_L1_error) - } else { - __Pyx_GOTREF(__pyx_cur_scope); - } - __pyx_cur_scope->__pyx_v_f = __pyx_v_f; - - /* "cfunc.to_py":65 - * 
@cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): - * def wrap(object b): # <<<<<<<<<<<<<< - * """wrap(b)""" - * return f(b) - */ - __pyx_t_1 = __Pyx_CyFunction_NewEx(&__pyx_mdef_11cfunc_dot_to_py_36__Pyx_CFunc_object____object___to_py_1wrap, 0, __pyx_n_s_Pyx_CFunc_object____object___t, ((PyObject*)__pyx_cur_scope), __pyx_n_s_cfunc_to_py, __pyx_d, ((PyObject *)__pyx_codeobj__11)); if (unlikely(!__pyx_t_1)) __PYX_ERR(2, 65, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_v_wrap = __pyx_t_1; - __pyx_t_1 = 0; - - /* "cfunc.to_py":68 - * """wrap(b)""" - * return f(b) - * return wrap # <<<<<<<<<<<<<< - * - * - */ - __Pyx_XDECREF(__pyx_r); - __Pyx_INCREF(__pyx_v_wrap); - __pyx_r = __pyx_v_wrap; - goto __pyx_L0; - - /* "cfunc.to_py":64 - * - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): # <<<<<<<<<<<<<< - * def wrap(object b): - * """wrap(b)""" - */ - - /* function exit code */ - __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_1); - __Pyx_AddTraceback("cfunc.to_py.__Pyx_CFunc_object____object___to_py", __pyx_clineno, __pyx_lineno, __pyx_filename); - __pyx_r = 0; - __pyx_L0:; - __Pyx_XDECREF(__pyx_v_wrap); - __Pyx_DECREF(((PyObject *)__pyx_cur_scope)); - __Pyx_XGIVEREF(__pyx_r); - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -static struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *__pyx_freelist___pyx_scope_struct____Pyx_CFunc_object____object___to_py[8]; -static int __pyx_freecount___pyx_scope_struct____Pyx_CFunc_object____object___to_py = 0; - -static PyObject *__pyx_tp_new___pyx_scope_struct____Pyx_CFunc_object____object___to_py(PyTypeObject *t, CYTHON_UNUSED PyObject *a, CYTHON_UNUSED PyObject *k) { - PyObject *o; - if (CYTHON_COMPILING_IN_CPYTHON && likely((__pyx_freecount___pyx_scope_struct____Pyx_CFunc_object____object___to_py > 0) & (t->tp_basicsize == sizeof(struct 
__pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py)))) { - o = (PyObject*)__pyx_freelist___pyx_scope_struct____Pyx_CFunc_object____object___to_py[--__pyx_freecount___pyx_scope_struct____Pyx_CFunc_object____object___to_py]; - memset(o, 0, sizeof(struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py)); - (void) PyObject_INIT(o, t); - } else { - o = (*t->tp_alloc)(t, 0); - if (unlikely(!o)) return 0; - } - return o; -} - -static void __pyx_tp_dealloc___pyx_scope_struct____Pyx_CFunc_object____object___to_py(PyObject *o) { - if (CYTHON_COMPILING_IN_CPYTHON && ((__pyx_freecount___pyx_scope_struct____Pyx_CFunc_object____object___to_py < 8) & (Py_TYPE(o)->tp_basicsize == sizeof(struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py)))) { - __pyx_freelist___pyx_scope_struct____Pyx_CFunc_object____object___to_py[__pyx_freecount___pyx_scope_struct____Pyx_CFunc_object____object___to_py++] = ((struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py *)o); - } else { - (*Py_TYPE(o)->tp_free)(o); - } -} - -static PyTypeObject __pyx_scope_struct____Pyx_CFunc_object____object___to_py = { - PyVarObject_HEAD_INIT(0, 0) - "gensim.models._utils_any2vec.__pyx_scope_struct____Pyx_CFunc_object____object___to_py", /*tp_name*/ - sizeof(struct __pyx_obj___pyx_scope_struct____Pyx_CFunc_object____object___to_py), /*tp_basicsize*/ - 0, /*tp_itemsize*/ - __pyx_tp_dealloc___pyx_scope_struct____Pyx_CFunc_object____object___to_py, /*tp_dealloc*/ - 0, /*tp_print*/ - 0, /*tp_getattr*/ - 0, /*tp_setattr*/ - #if PY_MAJOR_VERSION < 3 - 0, /*tp_compare*/ - #endif - #if PY_MAJOR_VERSION >= 3 - 0, /*tp_as_async*/ - #endif - 0, /*tp_repr*/ - 0, /*tp_as_number*/ - 0, /*tp_as_sequence*/ - 0, /*tp_as_mapping*/ - 0, /*tp_hash*/ - 0, /*tp_call*/ - 0, /*tp_str*/ - 0, /*tp_getattro*/ - 0, /*tp_setattro*/ - 0, /*tp_as_buffer*/ - Py_TPFLAGS_DEFAULT|Py_TPFLAGS_HAVE_VERSION_TAG|Py_TPFLAGS_CHECKTYPES|Py_TPFLAGS_HAVE_NEWBUFFER, /*tp_flags*/ - 0, 
/*tp_doc*/ - 0, /*tp_traverse*/ - 0, /*tp_clear*/ - 0, /*tp_richcompare*/ - 0, /*tp_weaklistoffset*/ - 0, /*tp_iter*/ - 0, /*tp_iternext*/ - 0, /*tp_methods*/ - 0, /*tp_members*/ - 0, /*tp_getset*/ - 0, /*tp_base*/ - 0, /*tp_dict*/ - 0, /*tp_descr_get*/ - 0, /*tp_descr_set*/ - 0, /*tp_dictoffset*/ - 0, /*tp_init*/ - 0, /*tp_alloc*/ - __pyx_tp_new___pyx_scope_struct____Pyx_CFunc_object____object___to_py, /*tp_new*/ - 0, /*tp_free*/ - 0, /*tp_is_gc*/ - 0, /*tp_bases*/ - 0, /*tp_mro*/ - 0, /*tp_cache*/ - 0, /*tp_subclasses*/ - 0, /*tp_weaklist*/ - 0, /*tp_del*/ - 0, /*tp_version_tag*/ - #if PY_VERSION_HEX >= 0x030400a1 - 0, /*tp_finalize*/ - #endif -}; - -static PyMethodDef __pyx_methods[] = { - {"ft_hash", (PyCFunction)__pyx_pw_6gensim_6models_14_utils_any2vec_1ft_hash, METH_O, __pyx_doc_6gensim_6models_14_utils_any2vec_ft_hash}, - {"ft_hash_broken", (PyCFunction)__pyx_pw_6gensim_6models_14_utils_any2vec_3ft_hash_broken, METH_O, __pyx_doc_6gensim_6models_14_utils_any2vec_2ft_hash_broken}, - {"compute_ngrams", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14_utils_any2vec_5compute_ngrams, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14_utils_any2vec_4compute_ngrams}, - {0, 0, 0, 0} -}; - -#if PY_MAJOR_VERSION >= 3 -#if CYTHON_PEP489_MULTI_PHASE_INIT -static PyObject* __pyx_pymod_create(PyObject *spec, PyModuleDef *def); /*proto*/ -static int __pyx_pymod_exec__utils_any2vec(PyObject* module); /*proto*/ -static PyModuleDef_Slot __pyx_moduledef_slots[] = { - {Py_mod_create, (void*)__pyx_pymod_create}, - {Py_mod_exec, (void*)__pyx_pymod_exec__utils_any2vec}, - {0, NULL} -}; -#endif +#if PY_MAJOR_VERSION >= 3 +#if CYTHON_PEP489_MULTI_PHASE_INIT +static PyObject* __pyx_pymod_create(PyObject *spec, PyModuleDef *def); /*proto*/ +static int __pyx_pymod_exec__utils_any2vec(PyObject* module); /*proto*/ +static PyModuleDef_Slot __pyx_moduledef_slots[] = { + {Py_mod_create, (void*)__pyx_pymod_create}, + {Py_mod_exec, 
(void*)__pyx_pymod_exec__utils_any2vec}, + {0, NULL} +}; +#endif static struct PyModuleDef __pyx_moduledef = { PyModuleDef_HEAD_INIT, @@ -5478,16 +5317,12 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_ImportError, __pyx_k_ImportError, sizeof(__pyx_k_ImportError), 0, 0, 1, 1}, {&__pyx_kp_u_Non_native_byte_order_not_suppor, __pyx_k_Non_native_byte_order_not_suppor, sizeof(__pyx_k_Non_native_byte_order_not_suppor), 0, 1, 0, 0}, {&__pyx_n_s_PY2, __pyx_k_PY2, sizeof(__pyx_k_PY2), 0, 0, 1, 1}, - {&__pyx_n_s_Pyx_CFunc_object____object___t, __pyx_k_Pyx_CFunc_object____object___t, sizeof(__pyx_k_Pyx_CFunc_object____object___t), 0, 0, 1, 1}, {&__pyx_n_s_RuntimeError, __pyx_k_RuntimeError, sizeof(__pyx_k_RuntimeError), 0, 0, 1, 1}, {&__pyx_n_s_ValueError, __pyx_k_ValueError, sizeof(__pyx_k_ValueError), 0, 0, 1, 1}, {&__pyx_kp_u__2, __pyx_k__2, sizeof(__pyx_k__2), 0, 1, 0, 0}, - {&__pyx_n_s_b, __pyx_k_b, sizeof(__pyx_k_b), 0, 0, 1, 1}, - {&__pyx_n_s_byte_to_int, __pyx_k_byte_to_int, sizeof(__pyx_k_byte_to_int), 0, 0, 1, 1}, - {&__pyx_n_s_cfunc_to_py, __pyx_k_cfunc_to_py, sizeof(__pyx_k_cfunc_to_py), 0, 0, 1, 1}, {&__pyx_n_s_cline_in_traceback, __pyx_k_cline_in_traceback, sizeof(__pyx_k_cline_in_traceback), 0, 0, 1, 1}, + {&__pyx_n_s_encode, __pyx_k_encode, sizeof(__pyx_k_encode), 0, 0, 1, 1}, {&__pyx_n_s_import, __pyx_k_import, sizeof(__pyx_k_import), 0, 0, 1, 1}, - {&__pyx_n_s_int8, __pyx_k_int8, sizeof(__pyx_k_int8), 0, 0, 1, 1}, {&__pyx_n_s_main, __pyx_k_main, sizeof(__pyx_k_main), 0, 0, 1, 1}, {&__pyx_n_s_max_n, __pyx_k_max_n, sizeof(__pyx_k_max_n), 0, 0, 1, 1}, {&__pyx_n_s_min_n, __pyx_k_min_n, sizeof(__pyx_k_min_n), 0, 0, 1, 1}, @@ -5499,13 +5334,12 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_kp_s_numpy_core_multiarray_failed_to, __pyx_k_numpy_core_multiarray_failed_to, sizeof(__pyx_k_numpy_core_multiarray_failed_to), 0, 0, 1, 0}, {&__pyx_kp_s_numpy_core_umath_failed_to_impor, __pyx_k_numpy_core_umath_failed_to_impor, 
sizeof(__pyx_k_numpy_core_umath_failed_to_impor), 0, 0, 1, 0}, {&__pyx_n_s_range, __pyx_k_range, sizeof(__pyx_k_range), 0, 0, 1, 1}, + {&__pyx_kp_s_s, __pyx_k_s, sizeof(__pyx_k_s), 0, 0, 1, 0}, {&__pyx_n_s_six, __pyx_k_six, sizeof(__pyx_k_six), 0, 0, 1, 1}, - {&__pyx_kp_s_stringsource, __pyx_k_stringsource, sizeof(__pyx_k_stringsource), 0, 0, 1, 0}, {&__pyx_n_s_test, __pyx_k_test, sizeof(__pyx_k_test), 0, 0, 1, 1}, - {&__pyx_n_s_uint32, __pyx_k_uint32, sizeof(__pyx_k_uint32), 0, 0, 1, 1}, {&__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_k_unknown_dtype_code_in_numpy_pxd, sizeof(__pyx_k_unknown_dtype_code_in_numpy_pxd), 0, 1, 0, 0}, + {&__pyx_kp_s_utf_8, __pyx_k_utf_8, sizeof(__pyx_k_utf_8), 0, 0, 1, 0}, {&__pyx_n_s_word, __pyx_k_word, sizeof(__pyx_k_word), 0, 0, 1, 1}, - {&__pyx_n_s_wrap, __pyx_k_wrap, sizeof(__pyx_k_wrap), 0, 0, 1, 1}, {0, 0, 0, 0, 0, 0, 0} }; static CYTHON_SMALL_CODE int __Pyx_InitCachedBuiltins(void) { @@ -5522,7 +5356,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("__Pyx_InitCachedConstants", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -5533,7 +5367,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__3); __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, 
NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -5544,7 +5378,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__4); __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -5555,7 +5389,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__5); __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -5566,7 +5400,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__6); __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -5577,7 +5411,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__7); __Pyx_GIVEREF(__pyx_tuple__7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * 
except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -5588,7 +5422,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__8); __Pyx_GIVEREF(__pyx_tuple__8); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -5598,18 +5432,6 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __pyx_tuple__9 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__9)) __PYX_ERR(1, 1044, __pyx_L1_error) __Pyx_GOTREF(__pyx_tuple__9); __Pyx_GIVEREF(__pyx_tuple__9); - - /* "cfunc.to_py":65 - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): - * def wrap(object b): # <<<<<<<<<<<<<< - * """wrap(b)""" - * return f(b) - */ - __pyx_tuple__10 = PyTuple_Pack(1, __pyx_n_s_b); if (unlikely(!__pyx_tuple__10)) __PYX_ERR(2, 65, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__10); - __Pyx_GIVEREF(__pyx_tuple__10); - __pyx_codeobj__11 = (PyObject*)__Pyx_PyCode_New(1, 0, 1, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__10, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_stringsource, __pyx_n_s_wrap, 65, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__11)) __PYX_ERR(2, 65, __pyx_L1_error) __Pyx_RefNannyFinishContext(); return 0; __pyx_L1_error:; @@ -5621,7 +5443,6 @@ static CYTHON_SMALL_CODE int __Pyx_InitGlobals(void) { if (__Pyx_InitStrings(__pyx_string_tab) < 0) __PYX_ERR(0, 1, __pyx_L1_error); __pyx_int_0 = PyInt_FromLong(0); if (unlikely(!__pyx_int_0)) __PYX_ERR(0, 1, __pyx_L1_error) __pyx_int_1 = PyInt_FromLong(1); if (unlikely(!__pyx_int_1)) __PYX_ERR(0, 1, 
__pyx_L1_error) - __pyx_int_16777619 = PyInt_FromLong(16777619L); if (unlikely(!__pyx_int_16777619)) __PYX_ERR(0, 1, __pyx_L1_error) return 0; __pyx_L1_error:; return -1; @@ -5663,17 +5484,8 @@ static int __Pyx_modinit_type_init_code(void) { __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("__Pyx_modinit_type_init_code", 0); /*--- Type init code ---*/ - if (PyType_Ready(&__pyx_scope_struct____Pyx_CFunc_object____object___to_py) < 0) __PYX_ERR(2, 64, __pyx_L1_error) - __pyx_scope_struct____Pyx_CFunc_object____object___to_py.tp_print = 0; - if ((CYTHON_USE_TYPE_SLOTS && CYTHON_USE_PYTYPE_LOOKUP) && likely(!__pyx_scope_struct____Pyx_CFunc_object____object___to_py.tp_dictoffset && __pyx_scope_struct____Pyx_CFunc_object____object___to_py.tp_getattro == PyObject_GenericGetAttr)) { - __pyx_scope_struct____Pyx_CFunc_object____object___to_py.tp_getattro = __Pyx_PyObject_GenericGetAttrNoDict; - } - __pyx_ptype___pyx_scope_struct____Pyx_CFunc_object____object___to_py = &__pyx_scope_struct____Pyx_CFunc_object____object___to_py; __Pyx_RefNannyFinishContext(); return 0; - __pyx_L1_error:; - __Pyx_RefNannyFinishContext(); - return -1; } static int __Pyx_modinit_type_import_code(void) { @@ -5681,7 +5493,7 @@ static int __Pyx_modinit_type_import_code(void) { PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("__Pyx_modinit_type_import_code", 0); /*--- Type import code ---*/ - __pyx_t_1 = PyImport_ImportModule(__Pyx_BUILTIN_MODULE_NAME); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 9, __pyx_L1_error) + __pyx_t_1 = PyImport_ImportModule(__Pyx_BUILTIN_MODULE_NAME); if (unlikely(!__pyx_t_1)) __PYX_ERR(2, 9, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_ptype_7cpython_4type_type = __Pyx_ImportType(__pyx_t_1, __Pyx_BUILTIN_MODULE_NAME, "type", #if defined(PYPY_VERSION_NUM) && PYPY_VERSION_NUM < 0x050B0000 @@ -5690,7 +5502,7 @@ static int __Pyx_modinit_type_import_code(void) { sizeof(PyHeapTypeObject), #endif __Pyx_ImportType_CheckSize_Warn); - if (!__pyx_ptype_7cpython_4type_type) 
__PYX_ERR(3, 9, __pyx_L1_error) + if (!__pyx_ptype_7cpython_4type_type) __PYX_ERR(2, 9, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_t_1 = PyImport_ImportModule("numpy"); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 206, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); @@ -5823,7 +5635,6 @@ static CYTHON_SMALL_CODE int __pyx_pymod_exec__utils_any2vec(PyObject *__pyx_pyi { PyObject *__pyx_t_1 = NULL; PyObject *__pyx_t_2 = NULL; - int __pyx_t_3; __Pyx_RefNannyDeclarations #if CYTHON_PEP489_MULTI_PHASE_INIT if (__pyx_m) { @@ -5920,7 +5731,7 @@ if (!__Pyx_RefNanny) { (void)__Pyx_modinit_global_init_code(); (void)__Pyx_modinit_variable_export_code(); (void)__Pyx_modinit_function_export_code(); - if (unlikely(__Pyx_modinit_type_init_code() != 0)) goto __pyx_L1_error; + (void)__Pyx_modinit_type_init_code(); if (unlikely(__Pyx_modinit_type_import_code() != 0)) goto __pyx_L1_error; (void)__Pyx_modinit_variable_import_code(); (void)__Pyx_modinit_function_import_code(); @@ -5929,63 +5740,56 @@ if (!__Pyx_RefNanny) { if (__Pyx_patch_abc() < 0) __PYX_ERR(0, 1, __pyx_L1_error) #endif - /* "gensim/models/_utils_any2vec.pyx":10 - * """General functions used for any2vec models.""" + /* "gensim/models/_utils_any2vec.pyx":17 + * ctypedef signed char int8_t * * from six import PY2 # <<<<<<<<<<<<<< * import numpy as np * cimport numpy as np */ - __pyx_t_1 = PyList_New(1); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 10, __pyx_L1_error) + __pyx_t_1 = PyList_New(1); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 17, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_INCREF(__pyx_n_s_PY2); __Pyx_GIVEREF(__pyx_n_s_PY2); PyList_SET_ITEM(__pyx_t_1, 0, __pyx_n_s_PY2); - __pyx_t_2 = __Pyx_Import(__pyx_n_s_six, __pyx_t_1, -1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 10, __pyx_L1_error) + __pyx_t_2 = __Pyx_Import(__pyx_n_s_six, __pyx_t_1, -1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 17, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_t_1 = __Pyx_ImportFrom(__pyx_t_2, 
__pyx_n_s_PY2); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 10, __pyx_L1_error) + __pyx_t_1 = __Pyx_ImportFrom(__pyx_t_2, __pyx_n_s_PY2); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 17, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_PY2, __pyx_t_1) < 0) __PYX_ERR(0, 10, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_PY2, __pyx_t_1) < 0) __PYX_ERR(0, 17, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/_utils_any2vec.pyx":11 + /* "gensim/models/_utils_any2vec.pyx":18 * * from six import PY2 * import numpy as np # <<<<<<<<<<<<<< * cimport numpy as np * */ - __pyx_t_2 = __Pyx_Import(__pyx_n_s_numpy, 0, -1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 11, __pyx_L1_error) + __pyx_t_2 = __Pyx_Import(__pyx_n_s_numpy, 0, -1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 18, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_np, __pyx_t_2) < 0) __PYX_ERR(0, 11, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_np, __pyx_t_2) < 0) __PYX_ERR(0, 18, __pyx_L1_error) __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/_utils_any2vec.pyx":21 - * return ord(b) + /* "gensim/models/_utils_any2vec.pyx":100 + * # as opposed to a new character. 
+ * # + * cdef unsigned char _MB_MASK = 0xC0 # <<<<<<<<<<<<<< + * cdef unsigned char _MB_START = 0x80 * - * _byte_to_int = _byte_to_int_py2 if PY2 else _byte_to_int_py3 # <<<<<<<<<<<<<< + */ + __pyx_v_6gensim_6models_14_utils_any2vec__MB_MASK = 0xC0; + + /* "gensim/models/_utils_any2vec.pyx":101 + * # + * cdef unsigned char _MB_MASK = 0xC0 + * cdef unsigned char _MB_START = 0x80 # <<<<<<<<<<<<<< * * */ - __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_PY2); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 21, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyObject_IsTrue(__pyx_t_1); if (unlikely(__pyx_t_3 < 0)) __PYX_ERR(0, 21, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - if (__pyx_t_3) { - __pyx_t_1 = __Pyx_CFunc_object____object___to_py(__pyx_f_6gensim_6models_14_utils_any2vec__byte_to_int_py2); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 21, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __pyx_t_1; - __pyx_t_1 = 0; - } else { - __pyx_t_1 = __Pyx_CFunc_object____object___to_py(__pyx_f_6gensim_6models_14_utils_any2vec__byte_to_int_py3); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 21, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __pyx_t_1; - __pyx_t_1 = 0; - } - if (PyDict_SetItem(__pyx_d, __pyx_n_s_byte_to_int, __pyx_t_2) < 0) __PYX_ERR(0, 21, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; + __pyx_v_6gensim_6models_14_utils_any2vec__MB_START = 0x80; /* "gensim/models/_utils_any2vec.pyx":1 * #!/usr/bin/env cython # <<<<<<<<<<<<<< @@ -5997,12 +5801,12 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_test, __pyx_t_2) < 0) __PYX_ERR(0, 1, __pyx_L1_error) __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "cfunc.to_py":64 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + * raise ImportError("numpy.core.umath failed to import") * - * @cname("__Pyx_CFunc_object____object___to_py") - * cdef object __Pyx_CFunc_object____object___to_py(object (*f)(object) ): # 
<<<<<<<<<<<<<< - * def wrap(object b): - * """wrap(b)""" + * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< + * try: + * _import_umath() */ /*--- Wrapped vars code ---*/ @@ -6076,6 +5880,43 @@ static PyObject *__Pyx_GetBuiltinName(PyObject *name) { return result; } +/* ArgTypeTest */ +static int __Pyx__ArgTypeTest(PyObject *obj, PyTypeObject *type, const char *name, int exact) +{ + if (unlikely(!type)) { + PyErr_SetString(PyExc_SystemError, "Missing type object"); + return 0; + } + else if (exact) { + #if PY_MAJOR_VERSION == 2 + if ((type == &PyBaseString_Type) && likely(__Pyx_PyBaseString_CheckExact(obj))) return 1; + #endif + } + else { + if (likely(__Pyx_TypeCheck(obj, type))) return 1; + } + PyErr_Format(PyExc_TypeError, + "Argument '%.200s' has incorrect type (expected %.200s, got %.200s)", + name, type->tp_name, Py_TYPE(obj)->tp_name); + return 0; +} + +/* unicode_iter */ +static CYTHON_INLINE int __Pyx_init_unicode_iteration( + PyObject* ustring, Py_ssize_t *length, void** data, int *kind) { +#if CYTHON_PEP393_ENABLED + if (unlikely(__Pyx_PyUnicode_READY(ustring) < 0)) return -1; + *kind = PyUnicode_KIND(ustring); + *length = PyUnicode_GET_LENGTH(ustring); + *data = PyUnicode_DATA(ustring); +#else + *kind = 0; + *length = PyUnicode_GET_SIZE(ustring); + *data = (void*)PyUnicode_AS_UNICODE(ustring); +#endif + return 0; +} + /* UnicodeAsUCS4 */ static CYTHON_INLINE Py_UCS4 __Pyx_PyUnicode_AsPy_UCS4(PyObject* x) { Py_ssize_t length; @@ -6136,391 +5977,88 @@ static long __Pyx__PyObject_Ord(PyObject* c) { return (long)(Py_UCS4)-1; } -/* GetModuleGlobalName */ -#if CYTHON_USE_DICT_VERSIONS -static PyObject *__Pyx__GetModuleGlobalName(PyObject *name, PY_UINT64_T *dict_version, PyObject **dict_cached_value) +/* JoinPyUnicode */ +static PyObject* __Pyx_PyUnicode_Join(PyObject* value_tuple, Py_ssize_t value_count, Py_ssize_t result_ulength, + CYTHON_UNUSED Py_UCS4 max_char) { +#if CYTHON_USE_UNICODE_INTERNALS && CYTHON_ASSUME_SAFE_MACROS && 
!CYTHON_AVOID_BORROWED_REFS + PyObject *result_uval; + int result_ukind; + Py_ssize_t i, char_pos; + void *result_udata; +#if CYTHON_PEP393_ENABLED + result_uval = PyUnicode_New(result_ulength, max_char); + if (unlikely(!result_uval)) return NULL; + result_ukind = (max_char <= 255) ? PyUnicode_1BYTE_KIND : (max_char <= 65535) ? PyUnicode_2BYTE_KIND : PyUnicode_4BYTE_KIND; + result_udata = PyUnicode_DATA(result_uval); #else -static CYTHON_INLINE PyObject *__Pyx__GetModuleGlobalName(PyObject *name) + result_uval = PyUnicode_FromUnicode(NULL, result_ulength); + if (unlikely(!result_uval)) return NULL; + result_ukind = sizeof(Py_UNICODE); + result_udata = PyUnicode_AS_UNICODE(result_uval); #endif -{ - PyObject *result; -#if !CYTHON_AVOID_BORROWED_REFS -#if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX >= 0x030500A1 - result = _PyDict_GetItem_KnownHash(__pyx_d, name, ((PyASCIIObject *) name)->hash); - __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) - if (likely(result)) { - return __Pyx_NewRef(result); - } else if (unlikely(PyErr_Occurred())) { - return NULL; - } -#else - result = PyDict_GetItem(__pyx_d, name); - __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) - if (likely(result)) { - return __Pyx_NewRef(result); + char_pos = 0; + for (i=0; i < value_count; i++) { + int ukind; + Py_ssize_t ulength; + void *udata; + PyObject *uval = PyTuple_GET_ITEM(value_tuple, i); + if (unlikely(__Pyx_PyUnicode_READY(uval))) + goto bad; + ulength = __Pyx_PyUnicode_GET_LENGTH(uval); + if (unlikely(!ulength)) + continue; + if (unlikely(char_pos + ulength < 0)) + goto overflow; + ukind = __Pyx_PyUnicode_KIND(uval); + udata = __Pyx_PyUnicode_DATA(uval); + if (!CYTHON_PEP393_ENABLED || ukind == result_ukind) { + memcpy((char *)result_udata + char_pos * result_ukind, udata, (size_t) (ulength * result_ukind)); + } else { + #if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX >= 0x030300F0 || defined(_PyUnicode_FastCopyCharacters) + 
_PyUnicode_FastCopyCharacters(result_uval, char_pos, uval, 0, ulength); + #else + Py_ssize_t j; + for (j=0; j < ulength; j++) { + Py_UCS4 uchar = __Pyx_PyUnicode_READ(ukind, udata, j); + __Pyx_PyUnicode_WRITE(result_ukind, result_udata, char_pos+j, uchar); + } + #endif + } + char_pos += ulength; } -#endif + return result_uval; +overflow: + PyErr_SetString(PyExc_OverflowError, "join() result is too long for a Python string"); +bad: + Py_DECREF(result_uval); + return NULL; #else - result = PyObject_GetItem(__pyx_d, name); - __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) - if (likely(result)) { - return __Pyx_NewRef(result); - } - PyErr_Clear(); + result_ulength++; + value_count++; + return PyUnicode_Join(__pyx_empty_unicode, value_tuple); #endif - return __Pyx_GetBuiltinName(name); } -/* PyCFunctionFastCall */ -#if CYTHON_FAST_PYCCALL -static CYTHON_INLINE PyObject * __Pyx_PyCFunction_FastCall(PyObject *func_obj, PyObject **args, Py_ssize_t nargs) { - PyCFunctionObject *func = (PyCFunctionObject*)func_obj; - PyCFunction meth = PyCFunction_GET_FUNCTION(func); - PyObject *self = PyCFunction_GET_SELF(func); - int flags = PyCFunction_GET_FLAGS(func); - assert(PyCFunction_Check(func)); - assert(METH_FASTCALL == (flags & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS | METH_STACKLESS))); - assert(nargs >= 0); - assert(nargs == 0 || args != NULL); - /* _PyCFunction_FastCallDict() must not be called with an exception set, - because it may clear it (directly or indirectly) and so the - caller loses its exception */ - assert(!PyErr_Occurred()); - if ((PY_VERSION_HEX < 0x030700A0) || unlikely(flags & METH_KEYWORDS)) { - return (*((__Pyx_PyCFunctionFastWithKeywords)(void*)meth)) (self, args, nargs, NULL); - } else { - return (*((__Pyx_PyCFunctionFast)(void*)meth)) (self, args, nargs); +/* PyObjectCall */ +#if CYTHON_COMPILING_IN_CPYTHON +static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg, PyObject *kw) { + 
PyObject *result; + ternaryfunc call = func->ob_type->tp_call; + if (unlikely(!call)) + return PyObject_Call(func, arg, kw); + if (unlikely(Py_EnterRecursiveCall((char*)" while calling a Python object"))) + return NULL; + result = (*call)(func, arg, kw); + Py_LeaveRecursiveCall(); + if (unlikely(!result) && unlikely(!PyErr_Occurred())) { + PyErr_SetString( + PyExc_SystemError, + "NULL result without error in PyObject_Call"); } + return result; } #endif -/* PyFunctionFastCall */ -#if CYTHON_FAST_PYCALL -static PyObject* __Pyx_PyFunction_FastCallNoKw(PyCodeObject *co, PyObject **args, Py_ssize_t na, - PyObject *globals) { - PyFrameObject *f; - PyThreadState *tstate = __Pyx_PyThreadState_Current; - PyObject **fastlocals; - Py_ssize_t i; - PyObject *result; - assert(globals != NULL); - /* XXX Perhaps we should create a specialized - PyFrame_New() that doesn't take locals, but does - take builtins without sanity checking them. - */ - assert(tstate != NULL); - f = PyFrame_New(tstate, co, globals, NULL); - if (f == NULL) { - return NULL; - } - fastlocals = __Pyx_PyFrame_GetLocalsplus(f); - for (i = 0; i < na; i++) { - Py_INCREF(*args); - fastlocals[i] = *args++; - } - result = PyEval_EvalFrameEx(f,0); - ++tstate->recursion_depth; - Py_DECREF(f); - --tstate->recursion_depth; - return result; -} -#if 1 || PY_VERSION_HEX < 0x030600B1 -static PyObject *__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, int nargs, PyObject *kwargs) { - PyCodeObject *co = (PyCodeObject *)PyFunction_GET_CODE(func); - PyObject *globals = PyFunction_GET_GLOBALS(func); - PyObject *argdefs = PyFunction_GET_DEFAULTS(func); - PyObject *closure; -#if PY_MAJOR_VERSION >= 3 - PyObject *kwdefs; -#endif - PyObject *kwtuple, **k; - PyObject **d; - Py_ssize_t nd; - Py_ssize_t nk; - PyObject *result; - assert(kwargs == NULL || PyDict_Check(kwargs)); - nk = kwargs ? 
PyDict_Size(kwargs) : 0; - if (Py_EnterRecursiveCall((char*)" while calling a Python object")) { - return NULL; - } - if ( -#if PY_MAJOR_VERSION >= 3 - co->co_kwonlyargcount == 0 && -#endif - likely(kwargs == NULL || nk == 0) && - co->co_flags == (CO_OPTIMIZED | CO_NEWLOCALS | CO_NOFREE)) { - if (argdefs == NULL && co->co_argcount == nargs) { - result = __Pyx_PyFunction_FastCallNoKw(co, args, nargs, globals); - goto done; - } - else if (nargs == 0 && argdefs != NULL - && co->co_argcount == Py_SIZE(argdefs)) { - /* function called with no arguments, but all parameters have - a default value: use default values as arguments .*/ - args = &PyTuple_GET_ITEM(argdefs, 0); - result =__Pyx_PyFunction_FastCallNoKw(co, args, Py_SIZE(argdefs), globals); - goto done; - } - } - if (kwargs != NULL) { - Py_ssize_t pos, i; - kwtuple = PyTuple_New(2 * nk); - if (kwtuple == NULL) { - result = NULL; - goto done; - } - k = &PyTuple_GET_ITEM(kwtuple, 0); - pos = i = 0; - while (PyDict_Next(kwargs, &pos, &k[i], &k[i+1])) { - Py_INCREF(k[i]); - Py_INCREF(k[i+1]); - i += 2; - } - nk = i / 2; - } - else { - kwtuple = NULL; - k = NULL; - } - closure = PyFunction_GET_CLOSURE(func); -#if PY_MAJOR_VERSION >= 3 - kwdefs = PyFunction_GET_KW_DEFAULTS(func); -#endif - if (argdefs != NULL) { - d = &PyTuple_GET_ITEM(argdefs, 0); - nd = Py_SIZE(argdefs); - } - else { - d = NULL; - nd = 0; - } -#if PY_MAJOR_VERSION >= 3 - result = PyEval_EvalCodeEx((PyObject*)co, globals, (PyObject *)NULL, - args, nargs, - k, (int)nk, - d, (int)nd, kwdefs, closure); -#else - result = PyEval_EvalCodeEx(co, globals, (PyObject *)NULL, - args, nargs, - k, (int)nk, - d, (int)nd, closure); -#endif - Py_XDECREF(kwtuple); -done: - Py_LeaveRecursiveCall(); - return result; -} -#endif -#endif - -/* PyObjectCall */ -#if CYTHON_COMPILING_IN_CPYTHON -static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg, PyObject *kw) { - PyObject *result; - ternaryfunc call = func->ob_type->tp_call; - if 
(unlikely(!call)) - return PyObject_Call(func, arg, kw); - if (unlikely(Py_EnterRecursiveCall((char*)" while calling a Python object"))) - return NULL; - result = (*call)(func, arg, kw); - Py_LeaveRecursiveCall(); - if (unlikely(!result) && unlikely(!PyErr_Occurred())) { - PyErr_SetString( - PyExc_SystemError, - "NULL result without error in PyObject_Call"); - } - return result; -} -#endif - -/* PyObjectCall2Args */ -static CYTHON_UNUSED PyObject* __Pyx_PyObject_Call2Args(PyObject* function, PyObject* arg1, PyObject* arg2) { - PyObject *args, *result = NULL; - #if CYTHON_FAST_PYCALL - if (PyFunction_Check(function)) { - PyObject *args[2] = {arg1, arg2}; - return __Pyx_PyFunction_FastCall(function, args, 2); - } - #endif - #if CYTHON_FAST_PYCCALL - if (__Pyx_PyFastCFunction_Check(function)) { - PyObject *args[2] = {arg1, arg2}; - return __Pyx_PyCFunction_FastCall(function, args, 2); - } - #endif - args = PyTuple_New(2); - if (unlikely(!args)) goto done; - Py_INCREF(arg1); - PyTuple_SET_ITEM(args, 0, arg1); - Py_INCREF(arg2); - PyTuple_SET_ITEM(args, 1, arg2); - Py_INCREF(function); - result = __Pyx_PyObject_Call(function, args, NULL); - Py_DECREF(args); - Py_DECREF(function); -done: - return result; -} - -/* PyObjectCallMethO */ -#if CYTHON_COMPILING_IN_CPYTHON -static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject *arg) { - PyObject *self, *result; - PyCFunction cfunc; - cfunc = PyCFunction_GET_FUNCTION(func); - self = PyCFunction_GET_SELF(func); - if (unlikely(Py_EnterRecursiveCall((char*)" while calling a Python object"))) - return NULL; - result = cfunc(self, arg); - Py_LeaveRecursiveCall(); - if (unlikely(!result) && unlikely(!PyErr_Occurred())) { - PyErr_SetString( - PyExc_SystemError, - "NULL result without error in PyObject_Call"); - } - return result; -} -#endif - -/* PyObjectCallOneArg */ -#if CYTHON_COMPILING_IN_CPYTHON -static PyObject* __Pyx__PyObject_CallOneArg(PyObject *func, PyObject *arg) { - PyObject *result; - PyObject 
*args = PyTuple_New(1); - if (unlikely(!args)) return NULL; - Py_INCREF(arg); - PyTuple_SET_ITEM(args, 0, arg); - result = __Pyx_PyObject_Call(func, args, NULL); - Py_DECREF(args); - return result; -} -static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObject *arg) { -#if CYTHON_FAST_PYCALL - if (PyFunction_Check(func)) { - return __Pyx_PyFunction_FastCall(func, &arg, 1); - } -#endif - if (likely(PyCFunction_Check(func))) { - if (likely(PyCFunction_GET_FLAGS(func) & METH_O)) { - return __Pyx_PyObject_CallMethO(func, arg); -#if CYTHON_FAST_PYCCALL - } else if (PyCFunction_GET_FLAGS(func) & METH_FASTCALL) { - return __Pyx_PyCFunction_FastCall(func, &arg, 1); -#endif - } - } - return __Pyx__PyObject_CallOneArg(func, arg); -} -#else -static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObject *arg) { - PyObject *result; - PyObject *args = PyTuple_Pack(1, arg); - if (unlikely(!args)) return NULL; - result = __Pyx_PyObject_Call(func, args, NULL); - Py_DECREF(args); - return result; -} -#endif - -/* ArgTypeTest */ -static int __Pyx__ArgTypeTest(PyObject *obj, PyTypeObject *type, const char *name, int exact) -{ - if (unlikely(!type)) { - PyErr_SetString(PyExc_SystemError, "Missing type object"); - return 0; - } - else if (exact) { - #if PY_MAJOR_VERSION == 2 - if ((type == &PyBaseString_Type) && likely(__Pyx_PyBaseString_CheckExact(obj))) return 1; - #endif - } - else { - if (likely(__Pyx_TypeCheck(obj, type))) return 1; - } - PyErr_Format(PyExc_TypeError, - "Argument '%.200s' has incorrect type (expected %.200s, got %.200s)", - name, type->tp_name, Py_TYPE(obj)->tp_name); - return 0; -} - -/* unicode_iter */ -static CYTHON_INLINE int __Pyx_init_unicode_iteration( - PyObject* ustring, Py_ssize_t *length, void** data, int *kind) { -#if CYTHON_PEP393_ENABLED - if (unlikely(__Pyx_PyUnicode_READY(ustring) < 0)) return -1; - *kind = PyUnicode_KIND(ustring); - *length = PyUnicode_GET_LENGTH(ustring); - *data = 
PyUnicode_DATA(ustring); -#else - *kind = 0; - *length = PyUnicode_GET_SIZE(ustring); - *data = (void*)PyUnicode_AS_UNICODE(ustring); -#endif - return 0; -} - -/* JoinPyUnicode */ -static PyObject* __Pyx_PyUnicode_Join(PyObject* value_tuple, Py_ssize_t value_count, Py_ssize_t result_ulength, - CYTHON_UNUSED Py_UCS4 max_char) { -#if CYTHON_USE_UNICODE_INTERNALS && CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - PyObject *result_uval; - int result_ukind; - Py_ssize_t i, char_pos; - void *result_udata; -#if CYTHON_PEP393_ENABLED - result_uval = PyUnicode_New(result_ulength, max_char); - if (unlikely(!result_uval)) return NULL; - result_ukind = (max_char <= 255) ? PyUnicode_1BYTE_KIND : (max_char <= 65535) ? PyUnicode_2BYTE_KIND : PyUnicode_4BYTE_KIND; - result_udata = PyUnicode_DATA(result_uval); -#else - result_uval = PyUnicode_FromUnicode(NULL, result_ulength); - if (unlikely(!result_uval)) return NULL; - result_ukind = sizeof(Py_UNICODE); - result_udata = PyUnicode_AS_UNICODE(result_uval); -#endif - char_pos = 0; - for (i=0; i < value_count; i++) { - int ukind; - Py_ssize_t ulength; - void *udata; - PyObject *uval = PyTuple_GET_ITEM(value_tuple, i); - if (unlikely(__Pyx_PyUnicode_READY(uval))) - goto bad; - ulength = __Pyx_PyUnicode_GET_LENGTH(uval); - if (unlikely(!ulength)) - continue; - if (unlikely(char_pos + ulength < 0)) - goto overflow; - ukind = __Pyx_PyUnicode_KIND(uval); - udata = __Pyx_PyUnicode_DATA(uval); - if (!CYTHON_PEP393_ENABLED || ukind == result_ukind) { - memcpy((char *)result_udata + char_pos * result_ukind, udata, (size_t) (ulength * result_ukind)); - } else { - #if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX >= 0x030300F0 || defined(_PyUnicode_FastCopyCharacters) - _PyUnicode_FastCopyCharacters(result_uval, char_pos, uval, 0, ulength); - #else - Py_ssize_t j; - for (j=0; j < ulength; j++) { - Py_UCS4 uchar = __Pyx_PyUnicode_READ(ukind, udata, j); - __Pyx_PyUnicode_WRITE(result_ukind, result_udata, char_pos+j, uchar); - } - 
#endif - } - char_pos += ulength; - } - return result_uval; -overflow: - PyErr_SetString(PyExc_OverflowError, "join() result is too long for a Python string"); -bad: - Py_DECREF(result_uval); - return NULL; -#else - result_ulength++; - value_count++; - return PyUnicode_Join(__pyx_empty_unicode, value_tuple); -#endif -} - /* PyIntBinop */ #if !CYTHON_COMPILING_IN_PYPY static PyObject* __Pyx_PyInt_AddObjC(PyObject *op1, PyObject *op2, CYTHON_UNUSED long intval, CYTHON_UNUSED int inplace) { @@ -6790,26 +6328,257 @@ static int __Pyx_ParseOptionalKeywords( goto invalid_keyword; } } - return 0; -arg_passed_twice: - __Pyx_RaiseDoubleKeywordsError(function_name, key); - goto bad; -invalid_keyword_type: - PyErr_Format(PyExc_TypeError, - "%.200s() keywords must be strings", function_name); - goto bad; -invalid_keyword: - PyErr_Format(PyExc_TypeError, - #if PY_MAJOR_VERSION < 3 - "%.200s() got an unexpected keyword argument '%.200s'", - function_name, PyString_AsString(key)); - #else - "%s() got an unexpected keyword argument '%U'", - function_name, key); - #endif -bad: - return -1; + return 0; +arg_passed_twice: + __Pyx_RaiseDoubleKeywordsError(function_name, key); + goto bad; +invalid_keyword_type: + PyErr_Format(PyExc_TypeError, + "%.200s() keywords must be strings", function_name); + goto bad; +invalid_keyword: + PyErr_Format(PyExc_TypeError, + #if PY_MAJOR_VERSION < 3 + "%.200s() got an unexpected keyword argument '%.200s'", + function_name, PyString_AsString(key)); + #else + "%s() got an unexpected keyword argument '%U'", + function_name, key); + #endif +bad: + return -1; +} + +/* PyCFunctionFastCall */ +#if CYTHON_FAST_PYCCALL +static CYTHON_INLINE PyObject * __Pyx_PyCFunction_FastCall(PyObject *func_obj, PyObject **args, Py_ssize_t nargs) { + PyCFunctionObject *func = (PyCFunctionObject*)func_obj; + PyCFunction meth = PyCFunction_GET_FUNCTION(func); + PyObject *self = PyCFunction_GET_SELF(func); + int flags = PyCFunction_GET_FLAGS(func); + 
assert(PyCFunction_Check(func)); + assert(METH_FASTCALL == (flags & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS | METH_STACKLESS))); + assert(nargs >= 0); + assert(nargs == 0 || args != NULL); + /* _PyCFunction_FastCallDict() must not be called with an exception set, + because it may clear it (directly or indirectly) and so the + caller loses its exception */ + assert(!PyErr_Occurred()); + if ((PY_VERSION_HEX < 0x030700A0) || unlikely(flags & METH_KEYWORDS)) { + return (*((__Pyx_PyCFunctionFastWithKeywords)(void*)meth)) (self, args, nargs, NULL); + } else { + return (*((__Pyx_PyCFunctionFast)(void*)meth)) (self, args, nargs); + } +} +#endif + +/* PyFunctionFastCall */ +#if CYTHON_FAST_PYCALL +static PyObject* __Pyx_PyFunction_FastCallNoKw(PyCodeObject *co, PyObject **args, Py_ssize_t na, + PyObject *globals) { + PyFrameObject *f; + PyThreadState *tstate = __Pyx_PyThreadState_Current; + PyObject **fastlocals; + Py_ssize_t i; + PyObject *result; + assert(globals != NULL); + /* XXX Perhaps we should create a specialized + PyFrame_New() that doesn't take locals, but does + take builtins without sanity checking them. 
+ */ + assert(tstate != NULL); + f = PyFrame_New(tstate, co, globals, NULL); + if (f == NULL) { + return NULL; + } + fastlocals = __Pyx_PyFrame_GetLocalsplus(f); + for (i = 0; i < na; i++) { + Py_INCREF(*args); + fastlocals[i] = *args++; + } + result = PyEval_EvalFrameEx(f,0); + ++tstate->recursion_depth; + Py_DECREF(f); + --tstate->recursion_depth; + return result; +} +#if 1 || PY_VERSION_HEX < 0x030600B1 +static PyObject *__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, int nargs, PyObject *kwargs) { + PyCodeObject *co = (PyCodeObject *)PyFunction_GET_CODE(func); + PyObject *globals = PyFunction_GET_GLOBALS(func); + PyObject *argdefs = PyFunction_GET_DEFAULTS(func); + PyObject *closure; +#if PY_MAJOR_VERSION >= 3 + PyObject *kwdefs; +#endif + PyObject *kwtuple, **k; + PyObject **d; + Py_ssize_t nd; + Py_ssize_t nk; + PyObject *result; + assert(kwargs == NULL || PyDict_Check(kwargs)); + nk = kwargs ? PyDict_Size(kwargs) : 0; + if (Py_EnterRecursiveCall((char*)" while calling a Python object")) { + return NULL; + } + if ( +#if PY_MAJOR_VERSION >= 3 + co->co_kwonlyargcount == 0 && +#endif + likely(kwargs == NULL || nk == 0) && + co->co_flags == (CO_OPTIMIZED | CO_NEWLOCALS | CO_NOFREE)) { + if (argdefs == NULL && co->co_argcount == nargs) { + result = __Pyx_PyFunction_FastCallNoKw(co, args, nargs, globals); + goto done; + } + else if (nargs == 0 && argdefs != NULL + && co->co_argcount == Py_SIZE(argdefs)) { + /* function called with no arguments, but all parameters have + a default value: use default values as arguments .*/ + args = &PyTuple_GET_ITEM(argdefs, 0); + result =__Pyx_PyFunction_FastCallNoKw(co, args, Py_SIZE(argdefs), globals); + goto done; + } + } + if (kwargs != NULL) { + Py_ssize_t pos, i; + kwtuple = PyTuple_New(2 * nk); + if (kwtuple == NULL) { + result = NULL; + goto done; + } + k = &PyTuple_GET_ITEM(kwtuple, 0); + pos = i = 0; + while (PyDict_Next(kwargs, &pos, &k[i], &k[i+1])) { + Py_INCREF(k[i]); + Py_INCREF(k[i+1]); + i += 2; + } 
+ nk = i / 2; + } + else { + kwtuple = NULL; + k = NULL; + } + closure = PyFunction_GET_CLOSURE(func); +#if PY_MAJOR_VERSION >= 3 + kwdefs = PyFunction_GET_KW_DEFAULTS(func); +#endif + if (argdefs != NULL) { + d = &PyTuple_GET_ITEM(argdefs, 0); + nd = Py_SIZE(argdefs); + } + else { + d = NULL; + nd = 0; + } +#if PY_MAJOR_VERSION >= 3 + result = PyEval_EvalCodeEx((PyObject*)co, globals, (PyObject *)NULL, + args, nargs, + k, (int)nk, + d, (int)nd, kwdefs, closure); +#else + result = PyEval_EvalCodeEx(co, globals, (PyObject *)NULL, + args, nargs, + k, (int)nk, + d, (int)nd, closure); +#endif + Py_XDECREF(kwtuple); +done: + Py_LeaveRecursiveCall(); + return result; +} +#endif +#endif + +/* PyObjectCall2Args */ +static CYTHON_UNUSED PyObject* __Pyx_PyObject_Call2Args(PyObject* function, PyObject* arg1, PyObject* arg2) { + PyObject *args, *result = NULL; + #if CYTHON_FAST_PYCALL + if (PyFunction_Check(function)) { + PyObject *args[2] = {arg1, arg2}; + return __Pyx_PyFunction_FastCall(function, args, 2); + } + #endif + #if CYTHON_FAST_PYCCALL + if (__Pyx_PyFastCFunction_Check(function)) { + PyObject *args[2] = {arg1, arg2}; + return __Pyx_PyCFunction_FastCall(function, args, 2); + } + #endif + args = PyTuple_New(2); + if (unlikely(!args)) goto done; + Py_INCREF(arg1); + PyTuple_SET_ITEM(args, 0, arg1); + Py_INCREF(arg2); + PyTuple_SET_ITEM(args, 1, arg2); + Py_INCREF(function); + result = __Pyx_PyObject_Call(function, args, NULL); + Py_DECREF(args); + Py_DECREF(function); +done: + return result; +} + +/* PyObjectCallMethO */ +#if CYTHON_COMPILING_IN_CPYTHON +static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject *arg) { + PyObject *self, *result; + PyCFunction cfunc; + cfunc = PyCFunction_GET_FUNCTION(func); + self = PyCFunction_GET_SELF(func); + if (unlikely(Py_EnterRecursiveCall((char*)" while calling a Python object"))) + return NULL; + result = cfunc(self, arg); + Py_LeaveRecursiveCall(); + if (unlikely(!result) && 
unlikely(!PyErr_Occurred())) { + PyErr_SetString( + PyExc_SystemError, + "NULL result without error in PyObject_Call"); + } + return result; +} +#endif + +/* PyObjectCallOneArg */ +#if CYTHON_COMPILING_IN_CPYTHON +static PyObject* __Pyx__PyObject_CallOneArg(PyObject *func, PyObject *arg) { + PyObject *result; + PyObject *args = PyTuple_New(1); + if (unlikely(!args)) return NULL; + Py_INCREF(arg); + PyTuple_SET_ITEM(args, 0, arg); + result = __Pyx_PyObject_Call(func, args, NULL); + Py_DECREF(args); + return result; +} +static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObject *arg) { +#if CYTHON_FAST_PYCALL + if (PyFunction_Check(func)) { + return __Pyx_PyFunction_FastCall(func, &arg, 1); + } +#endif + if (likely(PyCFunction_Check(func))) { + if (likely(PyCFunction_GET_FLAGS(func) & METH_O)) { + return __Pyx_PyObject_CallMethO(func, arg); +#if CYTHON_FAST_PYCCALL + } else if (PyCFunction_GET_FLAGS(func) & METH_FASTCALL) { + return __Pyx_PyCFunction_FastCall(func, &arg, 1); +#endif + } + } + return __Pyx__PyObject_CallOneArg(func, arg); } +#else +static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObject *arg) { + PyObject *result; + PyObject *args = PyTuple_Pack(1, arg); + if (unlikely(!args)) return NULL; + result = __Pyx_PyObject_Call(func, args, NULL); + Py_DECREF(args); + return result; +} +#endif /* PyErrFetchRestore */ #if CYTHON_FAST_THREAD_STATE @@ -7173,711 +6942,36 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) { _PyErr_StackItem *exc_info = tstate->exc_info; tmp_type = exc_info->exc_type; - tmp_value = exc_info->exc_value; - tmp_tb = exc_info->exc_traceback; - exc_info->exc_type = local_type; - exc_info->exc_value = local_value; - exc_info->exc_traceback = local_tb; - } - #else - tmp_type = tstate->exc_type; - tmp_value = tstate->exc_value; - tmp_tb = tstate->exc_traceback; - tstate->exc_type = local_type; - tstate->exc_value = local_value; - tstate->exc_traceback = 
local_tb; - #endif - Py_XDECREF(tmp_type); - Py_XDECREF(tmp_value); - Py_XDECREF(tmp_tb); -#else - PyErr_SetExcInfo(local_type, local_value, local_tb); -#endif - return 0; -bad: - *type = 0; - *value = 0; - *tb = 0; - Py_XDECREF(local_type); - Py_XDECREF(local_value); - Py_XDECREF(local_tb); - return -1; -} - -/* FetchCommonType */ -static PyTypeObject* __Pyx_FetchCommonType(PyTypeObject* type) { - PyObject* fake_module; - PyTypeObject* cached_type = NULL; - fake_module = PyImport_AddModule((char*) "_cython_" CYTHON_ABI); - if (!fake_module) return NULL; - Py_INCREF(fake_module); - cached_type = (PyTypeObject*) PyObject_GetAttrString(fake_module, type->tp_name); - if (cached_type) { - if (!PyType_Check((PyObject*)cached_type)) { - PyErr_Format(PyExc_TypeError, - "Shared Cython type %.200s is not a type object", - type->tp_name); - goto bad; - } - if (cached_type->tp_basicsize != type->tp_basicsize) { - PyErr_Format(PyExc_TypeError, - "Shared Cython type %.200s has the wrong size, try recompiling", - type->tp_name); - goto bad; - } - } else { - if (!PyErr_ExceptionMatches(PyExc_AttributeError)) goto bad; - PyErr_Clear(); - if (PyType_Ready(type) < 0) goto bad; - if (PyObject_SetAttrString(fake_module, type->tp_name, (PyObject*) type) < 0) - goto bad; - Py_INCREF(type); - cached_type = type; - } -done: - Py_DECREF(fake_module); - return cached_type; -bad: - Py_XDECREF(cached_type); - cached_type = NULL; - goto done; -} - -/* CythonFunction */ -#include -static PyObject * -__Pyx_CyFunction_get_doc(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *closure) -{ - if (unlikely(op->func_doc == NULL)) { - if (op->func.m_ml->ml_doc) { -#if PY_MAJOR_VERSION >= 3 - op->func_doc = PyUnicode_FromString(op->func.m_ml->ml_doc); -#else - op->func_doc = PyString_FromString(op->func.m_ml->ml_doc); -#endif - if (unlikely(op->func_doc == NULL)) - return NULL; - } else { - Py_INCREF(Py_None); - return Py_None; - } - } - Py_INCREF(op->func_doc); - return op->func_doc; -} -static int 
-__Pyx_CyFunction_set_doc(__pyx_CyFunctionObject *op, PyObject *value, CYTHON_UNUSED void *context) -{ - PyObject *tmp = op->func_doc; - if (value == NULL) { - value = Py_None; - } - Py_INCREF(value); - op->func_doc = value; - Py_XDECREF(tmp); - return 0; -} -static PyObject * -__Pyx_CyFunction_get_name(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) -{ - if (unlikely(op->func_name == NULL)) { -#if PY_MAJOR_VERSION >= 3 - op->func_name = PyUnicode_InternFromString(op->func.m_ml->ml_name); -#else - op->func_name = PyString_InternFromString(op->func.m_ml->ml_name); -#endif - if (unlikely(op->func_name == NULL)) - return NULL; - } - Py_INCREF(op->func_name); - return op->func_name; -} -static int -__Pyx_CyFunction_set_name(__pyx_CyFunctionObject *op, PyObject *value, CYTHON_UNUSED void *context) -{ - PyObject *tmp; -#if PY_MAJOR_VERSION >= 3 - if (unlikely(value == NULL || !PyUnicode_Check(value))) -#else - if (unlikely(value == NULL || !PyString_Check(value))) -#endif - { - PyErr_SetString(PyExc_TypeError, - "__name__ must be set to a string object"); - return -1; - } - tmp = op->func_name; - Py_INCREF(value); - op->func_name = value; - Py_XDECREF(tmp); - return 0; -} -static PyObject * -__Pyx_CyFunction_get_qualname(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) -{ - Py_INCREF(op->func_qualname); - return op->func_qualname; -} -static int -__Pyx_CyFunction_set_qualname(__pyx_CyFunctionObject *op, PyObject *value, CYTHON_UNUSED void *context) -{ - PyObject *tmp; -#if PY_MAJOR_VERSION >= 3 - if (unlikely(value == NULL || !PyUnicode_Check(value))) -#else - if (unlikely(value == NULL || !PyString_Check(value))) -#endif - { - PyErr_SetString(PyExc_TypeError, - "__qualname__ must be set to a string object"); - return -1; - } - tmp = op->func_qualname; - Py_INCREF(value); - op->func_qualname = value; - Py_XDECREF(tmp); - return 0; -} -static PyObject * -__Pyx_CyFunction_get_self(__pyx_CyFunctionObject *m, CYTHON_UNUSED void *closure) -{ - PyObject *self; 
- self = m->func_closure; - if (self == NULL) - self = Py_None; - Py_INCREF(self); - return self; -} -static PyObject * -__Pyx_CyFunction_get_dict(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) -{ - if (unlikely(op->func_dict == NULL)) { - op->func_dict = PyDict_New(); - if (unlikely(op->func_dict == NULL)) - return NULL; - } - Py_INCREF(op->func_dict); - return op->func_dict; -} -static int -__Pyx_CyFunction_set_dict(__pyx_CyFunctionObject *op, PyObject *value, CYTHON_UNUSED void *context) -{ - PyObject *tmp; - if (unlikely(value == NULL)) { - PyErr_SetString(PyExc_TypeError, - "function's dictionary may not be deleted"); - return -1; - } - if (unlikely(!PyDict_Check(value))) { - PyErr_SetString(PyExc_TypeError, - "setting function's dictionary to a non-dict"); - return -1; - } - tmp = op->func_dict; - Py_INCREF(value); - op->func_dict = value; - Py_XDECREF(tmp); - return 0; -} -static PyObject * -__Pyx_CyFunction_get_globals(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) -{ - Py_INCREF(op->func_globals); - return op->func_globals; -} -static PyObject * -__Pyx_CyFunction_get_closure(CYTHON_UNUSED __pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) -{ - Py_INCREF(Py_None); - return Py_None; -} -static PyObject * -__Pyx_CyFunction_get_code(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) -{ - PyObject* result = (op->func_code) ? 
op->func_code : Py_None; - Py_INCREF(result); - return result; -} -static int -__Pyx_CyFunction_init_defaults(__pyx_CyFunctionObject *op) { - int result = 0; - PyObject *res = op->defaults_getter((PyObject *) op); - if (unlikely(!res)) - return -1; - #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - op->defaults_tuple = PyTuple_GET_ITEM(res, 0); - Py_INCREF(op->defaults_tuple); - op->defaults_kwdict = PyTuple_GET_ITEM(res, 1); - Py_INCREF(op->defaults_kwdict); - #else - op->defaults_tuple = PySequence_ITEM(res, 0); - if (unlikely(!op->defaults_tuple)) result = -1; - else { - op->defaults_kwdict = PySequence_ITEM(res, 1); - if (unlikely(!op->defaults_kwdict)) result = -1; - } - #endif - Py_DECREF(res); - return result; -} -static int -__Pyx_CyFunction_set_defaults(__pyx_CyFunctionObject *op, PyObject* value, CYTHON_UNUSED void *context) { - PyObject* tmp; - if (!value) { - value = Py_None; - } else if (value != Py_None && !PyTuple_Check(value)) { - PyErr_SetString(PyExc_TypeError, - "__defaults__ must be set to a tuple object"); - return -1; - } - Py_INCREF(value); - tmp = op->defaults_tuple; - op->defaults_tuple = value; - Py_XDECREF(tmp); - return 0; -} -static PyObject * -__Pyx_CyFunction_get_defaults(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) { - PyObject* result = op->defaults_tuple; - if (unlikely(!result)) { - if (op->defaults_getter) { - if (__Pyx_CyFunction_init_defaults(op) < 0) return NULL; - result = op->defaults_tuple; - } else { - result = Py_None; - } - } - Py_INCREF(result); - return result; -} -static int -__Pyx_CyFunction_set_kwdefaults(__pyx_CyFunctionObject *op, PyObject* value, CYTHON_UNUSED void *context) { - PyObject* tmp; - if (!value) { - value = Py_None; - } else if (value != Py_None && !PyDict_Check(value)) { - PyErr_SetString(PyExc_TypeError, - "__kwdefaults__ must be set to a dict object"); - return -1; - } - Py_INCREF(value); - tmp = op->defaults_kwdict; - op->defaults_kwdict = value; - Py_XDECREF(tmp); - 
return 0; -} -static PyObject * -__Pyx_CyFunction_get_kwdefaults(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) { - PyObject* result = op->defaults_kwdict; - if (unlikely(!result)) { - if (op->defaults_getter) { - if (__Pyx_CyFunction_init_defaults(op) < 0) return NULL; - result = op->defaults_kwdict; - } else { - result = Py_None; - } - } - Py_INCREF(result); - return result; -} -static int -__Pyx_CyFunction_set_annotations(__pyx_CyFunctionObject *op, PyObject* value, CYTHON_UNUSED void *context) { - PyObject* tmp; - if (!value || value == Py_None) { - value = NULL; - } else if (!PyDict_Check(value)) { - PyErr_SetString(PyExc_TypeError, - "__annotations__ must be set to a dict object"); - return -1; - } - Py_XINCREF(value); - tmp = op->func_annotations; - op->func_annotations = value; - Py_XDECREF(tmp); - return 0; -} -static PyObject * -__Pyx_CyFunction_get_annotations(__pyx_CyFunctionObject *op, CYTHON_UNUSED void *context) { - PyObject* result = op->func_annotations; - if (unlikely(!result)) { - result = PyDict_New(); - if (unlikely(!result)) return NULL; - op->func_annotations = result; - } - Py_INCREF(result); - return result; -} -static PyGetSetDef __pyx_CyFunction_getsets[] = { - {(char *) "func_doc", (getter)__Pyx_CyFunction_get_doc, (setter)__Pyx_CyFunction_set_doc, 0, 0}, - {(char *) "__doc__", (getter)__Pyx_CyFunction_get_doc, (setter)__Pyx_CyFunction_set_doc, 0, 0}, - {(char *) "func_name", (getter)__Pyx_CyFunction_get_name, (setter)__Pyx_CyFunction_set_name, 0, 0}, - {(char *) "__name__", (getter)__Pyx_CyFunction_get_name, (setter)__Pyx_CyFunction_set_name, 0, 0}, - {(char *) "__qualname__", (getter)__Pyx_CyFunction_get_qualname, (setter)__Pyx_CyFunction_set_qualname, 0, 0}, - {(char *) "__self__", (getter)__Pyx_CyFunction_get_self, 0, 0, 0}, - {(char *) "func_dict", (getter)__Pyx_CyFunction_get_dict, (setter)__Pyx_CyFunction_set_dict, 0, 0}, - {(char *) "__dict__", (getter)__Pyx_CyFunction_get_dict, (setter)__Pyx_CyFunction_set_dict, 0, 0}, 
- {(char *) "func_globals", (getter)__Pyx_CyFunction_get_globals, 0, 0, 0}, - {(char *) "__globals__", (getter)__Pyx_CyFunction_get_globals, 0, 0, 0}, - {(char *) "func_closure", (getter)__Pyx_CyFunction_get_closure, 0, 0, 0}, - {(char *) "__closure__", (getter)__Pyx_CyFunction_get_closure, 0, 0, 0}, - {(char *) "func_code", (getter)__Pyx_CyFunction_get_code, 0, 0, 0}, - {(char *) "__code__", (getter)__Pyx_CyFunction_get_code, 0, 0, 0}, - {(char *) "func_defaults", (getter)__Pyx_CyFunction_get_defaults, (setter)__Pyx_CyFunction_set_defaults, 0, 0}, - {(char *) "__defaults__", (getter)__Pyx_CyFunction_get_defaults, (setter)__Pyx_CyFunction_set_defaults, 0, 0}, - {(char *) "__kwdefaults__", (getter)__Pyx_CyFunction_get_kwdefaults, (setter)__Pyx_CyFunction_set_kwdefaults, 0, 0}, - {(char *) "__annotations__", (getter)__Pyx_CyFunction_get_annotations, (setter)__Pyx_CyFunction_set_annotations, 0, 0}, - {0, 0, 0, 0, 0} -}; -static PyMemberDef __pyx_CyFunction_members[] = { - {(char *) "__module__", T_OBJECT, offsetof(PyCFunctionObject, m_module), PY_WRITE_RESTRICTED, 0}, - {0, 0, 0, 0, 0} -}; -static PyObject * -__Pyx_CyFunction_reduce(__pyx_CyFunctionObject *m, CYTHON_UNUSED PyObject *args) -{ -#if PY_MAJOR_VERSION >= 3 - return PyUnicode_FromString(m->func.m_ml->ml_name); -#else - return PyString_FromString(m->func.m_ml->ml_name); -#endif -} -static PyMethodDef __pyx_CyFunction_methods[] = { - {"__reduce__", (PyCFunction)__Pyx_CyFunction_reduce, METH_VARARGS, 0}, - {0, 0, 0, 0} -}; -#if PY_VERSION_HEX < 0x030500A0 -#define __Pyx_CyFunction_weakreflist(cyfunc) ((cyfunc)->func_weakreflist) -#else -#define __Pyx_CyFunction_weakreflist(cyfunc) ((cyfunc)->func.m_weakreflist) -#endif -static PyObject *__Pyx_CyFunction_New(PyTypeObject *type, PyMethodDef *ml, int flags, PyObject* qualname, - PyObject *closure, PyObject *module, PyObject* globals, PyObject* code) { - __pyx_CyFunctionObject *op = PyObject_GC_New(__pyx_CyFunctionObject, type); - if (op == NULL) - return NULL; - 
op->flags = flags; - __Pyx_CyFunction_weakreflist(op) = NULL; - op->func.m_ml = ml; - op->func.m_self = (PyObject *) op; - Py_XINCREF(closure); - op->func_closure = closure; - Py_XINCREF(module); - op->func.m_module = module; - op->func_dict = NULL; - op->func_name = NULL; - Py_INCREF(qualname); - op->func_qualname = qualname; - op->func_doc = NULL; - op->func_classobj = NULL; - op->func_globals = globals; - Py_INCREF(op->func_globals); - Py_XINCREF(code); - op->func_code = code; - op->defaults_pyobjects = 0; - op->defaults = NULL; - op->defaults_tuple = NULL; - op->defaults_kwdict = NULL; - op->defaults_getter = NULL; - op->func_annotations = NULL; - PyObject_GC_Track(op); - return (PyObject *) op; -} -static int -__Pyx_CyFunction_clear(__pyx_CyFunctionObject *m) -{ - Py_CLEAR(m->func_closure); - Py_CLEAR(m->func.m_module); - Py_CLEAR(m->func_dict); - Py_CLEAR(m->func_name); - Py_CLEAR(m->func_qualname); - Py_CLEAR(m->func_doc); - Py_CLEAR(m->func_globals); - Py_CLEAR(m->func_code); - Py_CLEAR(m->func_classobj); - Py_CLEAR(m->defaults_tuple); - Py_CLEAR(m->defaults_kwdict); - Py_CLEAR(m->func_annotations); - if (m->defaults) { - PyObject **pydefaults = __Pyx_CyFunction_Defaults(PyObject *, m); - int i; - for (i = 0; i < m->defaults_pyobjects; i++) - Py_XDECREF(pydefaults[i]); - PyObject_Free(m->defaults); - m->defaults = NULL; - } - return 0; -} -static void __Pyx__CyFunction_dealloc(__pyx_CyFunctionObject *m) -{ - if (__Pyx_CyFunction_weakreflist(m) != NULL) - PyObject_ClearWeakRefs((PyObject *) m); - __Pyx_CyFunction_clear(m); - PyObject_GC_Del(m); -} -static void __Pyx_CyFunction_dealloc(__pyx_CyFunctionObject *m) -{ - PyObject_GC_UnTrack(m); - __Pyx__CyFunction_dealloc(m); -} -static int __Pyx_CyFunction_traverse(__pyx_CyFunctionObject *m, visitproc visit, void *arg) -{ - Py_VISIT(m->func_closure); - Py_VISIT(m->func.m_module); - Py_VISIT(m->func_dict); - Py_VISIT(m->func_name); - Py_VISIT(m->func_qualname); - Py_VISIT(m->func_doc); - 
Py_VISIT(m->func_globals); - Py_VISIT(m->func_code); - Py_VISIT(m->func_classobj); - Py_VISIT(m->defaults_tuple); - Py_VISIT(m->defaults_kwdict); - if (m->defaults) { - PyObject **pydefaults = __Pyx_CyFunction_Defaults(PyObject *, m); - int i; - for (i = 0; i < m->defaults_pyobjects; i++) - Py_VISIT(pydefaults[i]); - } - return 0; -} -static PyObject *__Pyx_CyFunction_descr_get(PyObject *func, PyObject *obj, PyObject *type) -{ - __pyx_CyFunctionObject *m = (__pyx_CyFunctionObject *) func; - if (m->flags & __Pyx_CYFUNCTION_STATICMETHOD) { - Py_INCREF(func); - return func; - } - if (m->flags & __Pyx_CYFUNCTION_CLASSMETHOD) { - if (type == NULL) - type = (PyObject *)(Py_TYPE(obj)); - return __Pyx_PyMethod_New(func, type, (PyObject *)(Py_TYPE(type))); - } - if (obj == Py_None) - obj = NULL; - return __Pyx_PyMethod_New(func, obj, type); -} -static PyObject* -__Pyx_CyFunction_repr(__pyx_CyFunctionObject *op) -{ -#if PY_MAJOR_VERSION >= 3 - return PyUnicode_FromFormat("", - op->func_qualname, (void *)op); -#else - return PyString_FromFormat("", - PyString_AsString(op->func_qualname), (void *)op); -#endif -} -static PyObject * __Pyx_CyFunction_CallMethod(PyObject *func, PyObject *self, PyObject *arg, PyObject *kw) { - PyCFunctionObject* f = (PyCFunctionObject*)func; - PyCFunction meth = f->m_ml->ml_meth; - Py_ssize_t size; - switch (f->m_ml->ml_flags & (METH_VARARGS | METH_KEYWORDS | METH_NOARGS | METH_O)) { - case METH_VARARGS: - if (likely(kw == NULL || PyDict_Size(kw) == 0)) - return (*meth)(self, arg); - break; - case METH_VARARGS | METH_KEYWORDS: - return (*(PyCFunctionWithKeywords)(void*)meth)(self, arg, kw); - case METH_NOARGS: - if (likely(kw == NULL || PyDict_Size(kw) == 0)) { - size = PyTuple_GET_SIZE(arg); - if (likely(size == 0)) - return (*meth)(self, NULL); - PyErr_Format(PyExc_TypeError, - "%.200s() takes no arguments (%" CYTHON_FORMAT_SSIZE_T "d given)", - f->m_ml->ml_name, size); - return NULL; - } - break; - case METH_O: - if (likely(kw == NULL || 
PyDict_Size(kw) == 0)) { - size = PyTuple_GET_SIZE(arg); - if (likely(size == 1)) { - PyObject *result, *arg0; - #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - arg0 = PyTuple_GET_ITEM(arg, 0); - #else - arg0 = PySequence_ITEM(arg, 0); if (unlikely(!arg0)) return NULL; - #endif - result = (*meth)(self, arg0); - #if !(CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS) - Py_DECREF(arg0); - #endif - return result; - } - PyErr_Format(PyExc_TypeError, - "%.200s() takes exactly one argument (%" CYTHON_FORMAT_SSIZE_T "d given)", - f->m_ml->ml_name, size); - return NULL; - } - break; - default: - PyErr_SetString(PyExc_SystemError, "Bad call flags in " - "__Pyx_CyFunction_Call. METH_OLDARGS is no " - "longer supported!"); - return NULL; - } - PyErr_Format(PyExc_TypeError, "%.200s() takes no keyword arguments", - f->m_ml->ml_name); - return NULL; -} -static CYTHON_INLINE PyObject *__Pyx_CyFunction_Call(PyObject *func, PyObject *arg, PyObject *kw) { - return __Pyx_CyFunction_CallMethod(func, ((PyCFunctionObject*)func)->m_self, arg, kw); -} -static PyObject *__Pyx_CyFunction_CallAsMethod(PyObject *func, PyObject *args, PyObject *kw) { - PyObject *result; - __pyx_CyFunctionObject *cyfunc = (__pyx_CyFunctionObject *) func; - if ((cyfunc->flags & __Pyx_CYFUNCTION_CCLASS) && !(cyfunc->flags & __Pyx_CYFUNCTION_STATICMETHOD)) { - Py_ssize_t argc; - PyObject *new_args; - PyObject *self; - argc = PyTuple_GET_SIZE(args); - new_args = PyTuple_GetSlice(args, 1, argc); - if (unlikely(!new_args)) - return NULL; - self = PyTuple_GetItem(args, 0); - if (unlikely(!self)) { - Py_DECREF(new_args); - return NULL; - } - result = __Pyx_CyFunction_CallMethod(func, self, new_args, kw); - Py_DECREF(new_args); - } else { - result = __Pyx_CyFunction_Call(func, args, kw); - } - return result; -} -static PyTypeObject __pyx_CyFunctionType_type = { - PyVarObject_HEAD_INIT(0, 0) - "cython_function_or_method", - sizeof(__pyx_CyFunctionObject), - 0, - (destructor) 
__Pyx_CyFunction_dealloc, - 0, - 0, - 0, -#if PY_MAJOR_VERSION < 3 - 0, -#else - 0, -#endif - (reprfunc) __Pyx_CyFunction_repr, - 0, - 0, - 0, - 0, - __Pyx_CyFunction_CallAsMethod, - 0, - 0, - 0, - 0, - Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC, - 0, - (traverseproc) __Pyx_CyFunction_traverse, - (inquiry) __Pyx_CyFunction_clear, - 0, -#if PY_VERSION_HEX < 0x030500A0 - offsetof(__pyx_CyFunctionObject, func_weakreflist), -#else - offsetof(PyCFunctionObject, m_weakreflist), -#endif - 0, - 0, - __pyx_CyFunction_methods, - __pyx_CyFunction_members, - __pyx_CyFunction_getsets, - 0, - 0, - __Pyx_CyFunction_descr_get, - 0, - offsetof(__pyx_CyFunctionObject, func_dict), - 0, - 0, - 0, - 0, - 0, - 0, - 0, - 0, - 0, - 0, - 0, - 0, -#if PY_VERSION_HEX >= 0x030400a1 - 0, -#endif -}; -static int __pyx_CyFunction_init(void) { - __pyx_CyFunctionType = __Pyx_FetchCommonType(&__pyx_CyFunctionType_type); - if (unlikely(__pyx_CyFunctionType == NULL)) { - return -1; + tmp_value = exc_info->exc_value; + tmp_tb = exc_info->exc_traceback; + exc_info->exc_type = local_type; + exc_info->exc_value = local_value; + exc_info->exc_traceback = local_tb; } - return 0; -} -static CYTHON_INLINE void *__Pyx_CyFunction_InitDefaults(PyObject *func, size_t size, int pyobjects) { - __pyx_CyFunctionObject *m = (__pyx_CyFunctionObject *) func; - m->defaults = PyObject_Malloc(size); - if (unlikely(!m->defaults)) - return PyErr_NoMemory(); - memset(m->defaults, 0, size); - m->defaults_pyobjects = pyobjects; - return m->defaults; -} -static CYTHON_INLINE void __Pyx_CyFunction_SetDefaultsTuple(PyObject *func, PyObject *tuple) { - __pyx_CyFunctionObject *m = (__pyx_CyFunctionObject *) func; - m->defaults_tuple = tuple; - Py_INCREF(tuple); -} -static CYTHON_INLINE void __Pyx_CyFunction_SetDefaultsKwDict(PyObject *func, PyObject *dict) { - __pyx_CyFunctionObject *m = (__pyx_CyFunctionObject *) func; - m->defaults_kwdict = dict; - Py_INCREF(dict); -} -static CYTHON_INLINE void 
__Pyx_CyFunction_SetAnnotationsDict(PyObject *func, PyObject *dict) { - __pyx_CyFunctionObject *m = (__pyx_CyFunctionObject *) func; - m->func_annotations = dict; - Py_INCREF(dict); -} - -/* PyObject_GenericGetAttrNoDict */ -#if CYTHON_USE_TYPE_SLOTS && CYTHON_USE_PYTYPE_LOOKUP && PY_VERSION_HEX < 0x03070000 -static PyObject *__Pyx_RaiseGenericGetAttributeError(PyTypeObject *tp, PyObject *attr_name) { - PyErr_Format(PyExc_AttributeError, -#if PY_MAJOR_VERSION >= 3 - "'%.50s' object has no attribute '%U'", - tp->tp_name, attr_name); + #else + tmp_type = tstate->exc_type; + tmp_value = tstate->exc_value; + tmp_tb = tstate->exc_traceback; + tstate->exc_type = local_type; + tstate->exc_value = local_value; + tstate->exc_traceback = local_tb; + #endif + Py_XDECREF(tmp_type); + Py_XDECREF(tmp_value); + Py_XDECREF(tmp_tb); #else - "'%.50s' object has no attribute '%.400s'", - tp->tp_name, PyString_AS_STRING(attr_name)); + PyErr_SetExcInfo(local_type, local_value, local_tb); #endif - return NULL; -} -static CYTHON_INLINE PyObject* __Pyx_PyObject_GenericGetAttrNoDict(PyObject* obj, PyObject* attr_name) { - PyObject *descr; - PyTypeObject *tp = Py_TYPE(obj); - if (unlikely(!PyString_Check(attr_name))) { - return PyObject_GenericGetAttr(obj, attr_name); - } - assert(!tp->tp_dictoffset); - descr = _PyType_Lookup(tp, attr_name); - if (unlikely(!descr)) { - return __Pyx_RaiseGenericGetAttributeError(tp, attr_name); - } - Py_INCREF(descr); - #if PY_MAJOR_VERSION < 3 - if (likely(PyType_HasFeature(Py_TYPE(descr), Py_TPFLAGS_HAVE_CLASS))) - #endif - { - descrgetfunc f = Py_TYPE(descr)->tp_descr_get; - if (unlikely(f)) { - PyObject *res = f(descr, obj, (PyObject *)tp); - Py_DECREF(descr); - return res; - } - } - return descr; + return 0; +bad: + *type = 0; + *value = 0; + *tb = 0; + Py_XDECREF(local_type); + Py_XDECREF(local_value); + Py_XDECREF(local_tb); + return -1; } -#endif /* TypeImport */ #ifndef __PYX_HAVE_RT_ImportType @@ -8249,24 +7343,24 @@ static void 
__Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ -static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { - const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_uint32_t(uint32_t value) { + const uint32_t neg_one = (uint32_t) ((uint32_t) 0 - (uint32_t) 1), const_zero = (uint32_t) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { - if (sizeof(long) < sizeof(long)) { + if (sizeof(uint32_t) < sizeof(long)) { return PyInt_FromLong((long) value); - } else if (sizeof(long) <= sizeof(unsigned long)) { + } else if (sizeof(uint32_t) <= sizeof(unsigned long)) { return PyLong_FromUnsignedLong((unsigned long) value); #ifdef HAVE_LONG_LONG - } else if (sizeof(long) <= sizeof(unsigned PY_LONG_LONG)) { + } else if (sizeof(uint32_t) <= sizeof(unsigned PY_LONG_LONG)) { return PyLong_FromUnsignedLongLong((unsigned PY_LONG_LONG) value); #endif } } else { - if (sizeof(long) <= sizeof(long)) { + if (sizeof(uint32_t) <= sizeof(long)) { return PyInt_FromLong((long) value); #ifdef HAVE_LONG_LONG - } else if (sizeof(long) <= sizeof(PY_LONG_LONG)) { + } else if (sizeof(uint32_t) <= sizeof(PY_LONG_LONG)) { return PyLong_FromLongLong((PY_LONG_LONG) value); #endif } @@ -8274,7 +7368,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { { int one = 1; int little = (int)*(unsigned char *)&one; unsigned char *bytes = (unsigned char *)&value; - return _PyLong_FromByteArray(bytes, sizeof(long), + return _PyLong_FromByteArray(bytes, sizeof(uint32_t), little, !is_unsigned); } } @@ -8449,7 +7543,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_int(unsigned int value) theta = 0; } else { r = -a.real; - theta = atan2f(0, -1); + theta = atan2f(0.0, -1.0); } } else { r = __Pyx_c_abs_float(a); @@ -8604,7 +7698,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_int(unsigned int value) theta = 0; } else { r = -a.real; - theta = atan2(0, -1); + theta 
= atan2(0.0, -1.0); } } else { r = __Pyx_c_abs_double(a); @@ -8643,59 +7737,437 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_int(int value) { #endif } } - { - int one = 1; int little = (int)*(unsigned char *)&one; - unsigned char *bytes = (unsigned char *)&value; - return _PyLong_FromByteArray(bytes, sizeof(int), - little, !is_unsigned); - } + { + int one = 1; int little = (int)*(unsigned char *)&one; + unsigned char *bytes = (unsigned char *)&value; + return _PyLong_FromByteArray(bytes, sizeof(int), + little, !is_unsigned); + } +} + +/* CIntToPy */ +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES value) { + const enum NPY_TYPES neg_one = (enum NPY_TYPES) ((enum NPY_TYPES) 0 - (enum NPY_TYPES) 1), const_zero = (enum NPY_TYPES) 0; + const int is_unsigned = neg_one > const_zero; + if (is_unsigned) { + if (sizeof(enum NPY_TYPES) < sizeof(long)) { + return PyInt_FromLong((long) value); + } else if (sizeof(enum NPY_TYPES) <= sizeof(unsigned long)) { + return PyLong_FromUnsignedLong((unsigned long) value); +#ifdef HAVE_LONG_LONG + } else if (sizeof(enum NPY_TYPES) <= sizeof(unsigned PY_LONG_LONG)) { + return PyLong_FromUnsignedLongLong((unsigned PY_LONG_LONG) value); +#endif + } + } else { + if (sizeof(enum NPY_TYPES) <= sizeof(long)) { + return PyInt_FromLong((long) value); +#ifdef HAVE_LONG_LONG + } else if (sizeof(enum NPY_TYPES) <= sizeof(PY_LONG_LONG)) { + return PyLong_FromLongLong((PY_LONG_LONG) value); +#endif + } + } + { + int one = 1; int little = (int)*(unsigned char *)&one; + unsigned char *bytes = (unsigned char *)&value; + return _PyLong_FromByteArray(bytes, sizeof(enum NPY_TYPES), + little, !is_unsigned); + } +} + +/* CIntFromPy */ +static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *x) { + const unsigned int neg_one = (unsigned int) ((unsigned int) 0 - (unsigned int) 1), const_zero = (unsigned int) 0; + const int is_unsigned = neg_one > const_zero; +#if PY_MAJOR_VERSION < 3 + if 
(likely(PyInt_Check(x))) { + if (sizeof(unsigned int) < sizeof(long)) { + __PYX_VERIFY_RETURN_INT(unsigned int, long, PyInt_AS_LONG(x)) + } else { + long val = PyInt_AS_LONG(x); + if (is_unsigned && unlikely(val < 0)) { + goto raise_neg_overflow; + } + return (unsigned int) val; + } + } else +#endif + if (likely(PyLong_Check(x))) { + if (is_unsigned) { +#if CYTHON_USE_PYLONG_INTERNALS + const digit* digits = ((PyLongObject*)x)->ob_digit; + switch (Py_SIZE(x)) { + case 0: return (unsigned int) 0; + case 1: __PYX_VERIFY_RETURN_INT(unsigned int, digit, digits[0]) + case 2: + if (8 * sizeof(unsigned int) > 1 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) >= 2 * PyLong_SHIFT) { + return (unsigned int) (((((unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0])); + } + } + break; + case 3: + if (8 * sizeof(unsigned int) > 2 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) >= 3 * PyLong_SHIFT) { + return (unsigned int) (((((((unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0])); + } + } + break; + case 4: + if (8 * sizeof(unsigned int) > 3 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) >= 4 * PyLong_SHIFT) { + return (unsigned int) (((((((((unsigned int)digits[3]) << PyLong_SHIFT) | 
(unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0])); + } + } + break; + } +#endif +#if CYTHON_COMPILING_IN_CPYTHON + if (unlikely(Py_SIZE(x) < 0)) { + goto raise_neg_overflow; + } +#else + { + int result = PyObject_RichCompareBool(x, Py_False, Py_LT); + if (unlikely(result < 0)) + return (unsigned int) -1; + if (unlikely(result == 1)) + goto raise_neg_overflow; + } +#endif + if (sizeof(unsigned int) <= sizeof(unsigned long)) { + __PYX_VERIFY_RETURN_INT_EXC(unsigned int, unsigned long, PyLong_AsUnsignedLong(x)) +#ifdef HAVE_LONG_LONG + } else if (sizeof(unsigned int) <= sizeof(unsigned PY_LONG_LONG)) { + __PYX_VERIFY_RETURN_INT_EXC(unsigned int, unsigned PY_LONG_LONG, PyLong_AsUnsignedLongLong(x)) +#endif + } + } else { +#if CYTHON_USE_PYLONG_INTERNALS + const digit* digits = ((PyLongObject*)x)->ob_digit; + switch (Py_SIZE(x)) { + case 0: return (unsigned int) 0; + case -1: __PYX_VERIFY_RETURN_INT(unsigned int, sdigit, (sdigit) (-(sdigit)digits[0])) + case 1: __PYX_VERIFY_RETURN_INT(unsigned int, digit, +digits[0]) + case -2: + if (8 * sizeof(unsigned int) - 1 > 1 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, long, -(long) (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) - 1 > 2 * PyLong_SHIFT) { + return (unsigned int) (((unsigned int)-1)*(((((unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + } + } + break; + case 2: + if (8 * sizeof(unsigned int) > 1 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) - 1 > 2 * PyLong_SHIFT) { + return (unsigned int) ((((((unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + } + } + break; + case -3: + if (8 * 
sizeof(unsigned int) - 1 > 2 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, long, -(long) (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) - 1 > 3 * PyLong_SHIFT) { + return (unsigned int) (((unsigned int)-1)*(((((((unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + } + } + break; + case 3: + if (8 * sizeof(unsigned int) > 2 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) - 1 > 3 * PyLong_SHIFT) { + return (unsigned int) ((((((((unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + } + } + break; + case -4: + if (8 * sizeof(unsigned int) - 1 > 3 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, long, -(long) (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) - 1 > 4 * PyLong_SHIFT) { + return (unsigned int) (((unsigned int)-1)*(((((((((unsigned int)digits[3]) << PyLong_SHIFT) | (unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + } + } + break; + case 4: + if (8 * sizeof(unsigned int) > 3 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << 
PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(unsigned int) - 1 > 4 * PyLong_SHIFT) { + return (unsigned int) ((((((((((unsigned int)digits[3]) << PyLong_SHIFT) | (unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + } + } + break; + } +#endif + if (sizeof(unsigned int) <= sizeof(long)) { + __PYX_VERIFY_RETURN_INT_EXC(unsigned int, long, PyLong_AsLong(x)) +#ifdef HAVE_LONG_LONG + } else if (sizeof(unsigned int) <= sizeof(PY_LONG_LONG)) { + __PYX_VERIFY_RETURN_INT_EXC(unsigned int, PY_LONG_LONG, PyLong_AsLongLong(x)) +#endif + } + } + { +#if CYTHON_COMPILING_IN_PYPY && !defined(_PyLong_AsByteArray) + PyErr_SetString(PyExc_RuntimeError, + "_PyLong_AsByteArray() not available in PyPy, cannot convert large numbers"); +#else + unsigned int val; + PyObject *v = __Pyx_PyNumber_IntOrLong(x); + #if PY_MAJOR_VERSION < 3 + if (likely(v) && !PyLong_Check(v)) { + PyObject *tmp = v; + v = PyNumber_Long(tmp); + Py_DECREF(tmp); + } + #endif + if (likely(v)) { + int one = 1; int is_little = (int)*(unsigned char *)&one; + unsigned char *bytes = (unsigned char *)&val; + int ret = _PyLong_AsByteArray((PyLongObject *)v, + bytes, sizeof(val), + is_little, !is_unsigned); + Py_DECREF(v); + if (likely(!ret)) + return val; + } +#endif + return (unsigned int) -1; + } + } else { + unsigned int val; + PyObject *tmp = __Pyx_PyNumber_IntOrLong(x); + if (!tmp) return (unsigned int) -1; + val = __Pyx_PyInt_As_unsigned_int(tmp); + Py_DECREF(tmp); + return val; + } +raise_overflow: + PyErr_SetString(PyExc_OverflowError, + "value too large to convert to unsigned int"); + return (unsigned int) -1; +raise_neg_overflow: + PyErr_SetString(PyExc_OverflowError, + "can't convert negative value to unsigned int"); + return (unsigned int) -1; } -/* CIntToPy */ -static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES value) { - const enum NPY_TYPES neg_one = (enum NPY_TYPES) ((enum NPY_TYPES) 0 - (enum 
NPY_TYPES) 1), const_zero = (enum NPY_TYPES) 0; +/* CIntFromPy */ +static CYTHON_INLINE char __Pyx_PyInt_As_char(PyObject *x) { + const char neg_one = (char) ((char) 0 - (char) 1), const_zero = (char) 0; const int is_unsigned = neg_one > const_zero; - if (is_unsigned) { - if (sizeof(enum NPY_TYPES) < sizeof(long)) { - return PyInt_FromLong((long) value); - } else if (sizeof(enum NPY_TYPES) <= sizeof(unsigned long)) { - return PyLong_FromUnsignedLong((unsigned long) value); +#if PY_MAJOR_VERSION < 3 + if (likely(PyInt_Check(x))) { + if (sizeof(char) < sizeof(long)) { + __PYX_VERIFY_RETURN_INT(char, long, PyInt_AS_LONG(x)) + } else { + long val = PyInt_AS_LONG(x); + if (is_unsigned && unlikely(val < 0)) { + goto raise_neg_overflow; + } + return (char) val; + } + } else +#endif + if (likely(PyLong_Check(x))) { + if (is_unsigned) { +#if CYTHON_USE_PYLONG_INTERNALS + const digit* digits = ((PyLongObject*)x)->ob_digit; + switch (Py_SIZE(x)) { + case 0: return (char) 0; + case 1: __PYX_VERIFY_RETURN_INT(char, digit, digits[0]) + case 2: + if (8 * sizeof(char) > 1 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) >= 2 * PyLong_SHIFT) { + return (char) (((((char)digits[1]) << PyLong_SHIFT) | (char)digits[0])); + } + } + break; + case 3: + if (8 * sizeof(char) > 2 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) >= 3 * PyLong_SHIFT) { + return (char) (((((((char)digits[2]) << PyLong_SHIFT) | (char)digits[1]) << PyLong_SHIFT) | (char)digits[0])); + } + } + break; + case 4: + if (8 * sizeof(char) > 3 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { + 
__PYX_VERIFY_RETURN_INT(char, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) >= 4 * PyLong_SHIFT) { + return (char) (((((((((char)digits[3]) << PyLong_SHIFT) | (char)digits[2]) << PyLong_SHIFT) | (char)digits[1]) << PyLong_SHIFT) | (char)digits[0])); + } + } + break; + } +#endif +#if CYTHON_COMPILING_IN_CPYTHON + if (unlikely(Py_SIZE(x) < 0)) { + goto raise_neg_overflow; + } +#else + { + int result = PyObject_RichCompareBool(x, Py_False, Py_LT); + if (unlikely(result < 0)) + return (char) -1; + if (unlikely(result == 1)) + goto raise_neg_overflow; + } +#endif + if (sizeof(char) <= sizeof(unsigned long)) { + __PYX_VERIFY_RETURN_INT_EXC(char, unsigned long, PyLong_AsUnsignedLong(x)) #ifdef HAVE_LONG_LONG - } else if (sizeof(enum NPY_TYPES) <= sizeof(unsigned PY_LONG_LONG)) { - return PyLong_FromUnsignedLongLong((unsigned PY_LONG_LONG) value); + } else if (sizeof(char) <= sizeof(unsigned PY_LONG_LONG)) { + __PYX_VERIFY_RETURN_INT_EXC(char, unsigned PY_LONG_LONG, PyLong_AsUnsignedLongLong(x)) #endif - } - } else { - if (sizeof(enum NPY_TYPES) <= sizeof(long)) { - return PyInt_FromLong((long) value); + } + } else { +#if CYTHON_USE_PYLONG_INTERNALS + const digit* digits = ((PyLongObject*)x)->ob_digit; + switch (Py_SIZE(x)) { + case 0: return (char) 0; + case -1: __PYX_VERIFY_RETURN_INT(char, sdigit, (sdigit) (-(sdigit)digits[0])) + case 1: __PYX_VERIFY_RETURN_INT(char, digit, +digits[0]) + case -2: + if (8 * sizeof(char) - 1 > 1 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, long, -(long) (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) - 1 > 2 * PyLong_SHIFT) { + return (char) (((char)-1)*(((((char)digits[1]) << PyLong_SHIFT) | (char)digits[0]))); + } + } + break; + case 2: + if (8 * 
sizeof(char) > 1 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) - 1 > 2 * PyLong_SHIFT) { + return (char) ((((((char)digits[1]) << PyLong_SHIFT) | (char)digits[0]))); + } + } + break; + case -3: + if (8 * sizeof(char) - 1 > 2 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, long, -(long) (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) - 1 > 3 * PyLong_SHIFT) { + return (char) (((char)-1)*(((((((char)digits[2]) << PyLong_SHIFT) | (char)digits[1]) << PyLong_SHIFT) | (char)digits[0]))); + } + } + break; + case 3: + if (8 * sizeof(char) > 2 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) - 1 > 3 * PyLong_SHIFT) { + return (char) ((((((((char)digits[2]) << PyLong_SHIFT) | (char)digits[1]) << PyLong_SHIFT) | (char)digits[0]))); + } + } + break; + case -4: + if (8 * sizeof(char) - 1 > 3 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { + __PYX_VERIFY_RETURN_INT(char, long, -(long) (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) - 1 > 4 * PyLong_SHIFT) { + return (char) (((char)-1)*(((((((((char)digits[3]) << PyLong_SHIFT) | (char)digits[2]) << PyLong_SHIFT) | (char)digits[1]) << PyLong_SHIFT) | (char)digits[0]))); + } + } + break; + case 4: + if (8 * sizeof(char) > 3 * PyLong_SHIFT) { + if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { + 
__PYX_VERIFY_RETURN_INT(char, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(char) - 1 > 4 * PyLong_SHIFT) { + return (char) ((((((((((char)digits[3]) << PyLong_SHIFT) | (char)digits[2]) << PyLong_SHIFT) | (char)digits[1]) << PyLong_SHIFT) | (char)digits[0]))); + } + } + break; + } +#endif + if (sizeof(char) <= sizeof(long)) { + __PYX_VERIFY_RETURN_INT_EXC(char, long, PyLong_AsLong(x)) #ifdef HAVE_LONG_LONG - } else if (sizeof(enum NPY_TYPES) <= sizeof(PY_LONG_LONG)) { - return PyLong_FromLongLong((PY_LONG_LONG) value); + } else if (sizeof(char) <= sizeof(PY_LONG_LONG)) { + __PYX_VERIFY_RETURN_INT_EXC(char, PY_LONG_LONG, PyLong_AsLongLong(x)) #endif + } } + { +#if CYTHON_COMPILING_IN_PYPY && !defined(_PyLong_AsByteArray) + PyErr_SetString(PyExc_RuntimeError, + "_PyLong_AsByteArray() not available in PyPy, cannot convert large numbers"); +#else + char val; + PyObject *v = __Pyx_PyNumber_IntOrLong(x); + #if PY_MAJOR_VERSION < 3 + if (likely(v) && !PyLong_Check(v)) { + PyObject *tmp = v; + v = PyNumber_Long(tmp); + Py_DECREF(tmp); + } + #endif + if (likely(v)) { + int one = 1; int is_little = (int)*(unsigned char *)&one; + unsigned char *bytes = (unsigned char *)&val; + int ret = _PyLong_AsByteArray((PyLongObject *)v, + bytes, sizeof(val), + is_little, !is_unsigned); + Py_DECREF(v); + if (likely(!ret)) + return val; + } +#endif + return (char) -1; + } + } else { + char val; + PyObject *tmp = __Pyx_PyNumber_IntOrLong(x); + if (!tmp) return (char) -1; + val = __Pyx_PyInt_As_char(tmp); + Py_DECREF(tmp); + return val; } - { - int one = 1; int little = (int)*(unsigned char *)&one; - unsigned char *bytes = (unsigned char *)&value; - return _PyLong_FromByteArray(bytes, sizeof(enum NPY_TYPES), - little, !is_unsigned); - } +raise_overflow: + PyErr_SetString(PyExc_OverflowError, + "value too large to convert to 
char"); + return (char) -1; +raise_neg_overflow: + PyErr_SetString(PyExc_OverflowError, + "can't convert negative value to char"); + return (char) -1; } /* CIntFromPy */ -static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *x) { - const unsigned int neg_one = (unsigned int) ((unsigned int) 0 - (unsigned int) 1), const_zero = (unsigned int) 0; +static CYTHON_INLINE size_t __Pyx_PyInt_As_size_t(PyObject *x) { + const size_t neg_one = (size_t) ((size_t) 0 - (size_t) 1), const_zero = (size_t) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { - if (sizeof(unsigned int) < sizeof(long)) { - __PYX_VERIFY_RETURN_INT(unsigned int, long, PyInt_AS_LONG(x)) + if (sizeof(size_t) < sizeof(long)) { + __PYX_VERIFY_RETURN_INT(size_t, long, PyInt_AS_LONG(x)) } else { long val = PyInt_AS_LONG(x); if (is_unsigned && unlikely(val < 0)) { goto raise_neg_overflow; } - return (unsigned int) val; + return (size_t) val; } } else #endif @@ -8704,32 +8176,32 @@ static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *x) { #if CYTHON_USE_PYLONG_INTERNALS const digit* digits = ((PyLongObject*)x)->ob_digit; switch (Py_SIZE(x)) { - case 0: return (unsigned int) 0; - case 1: __PYX_VERIFY_RETURN_INT(unsigned int, digit, digits[0]) + case 0: return (size_t) 0; + case 1: __PYX_VERIFY_RETURN_INT(size_t, digit, digits[0]) case 2: - if (8 * sizeof(unsigned int) > 1 * PyLong_SHIFT) { + if (8 * sizeof(size_t) > 1 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) >= 2 * PyLong_SHIFT) { - return (unsigned int) (((((unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0])); + __PYX_VERIFY_RETURN_INT(size_t, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * 
sizeof(size_t) >= 2 * PyLong_SHIFT) { + return (size_t) (((((size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0])); } } break; case 3: - if (8 * sizeof(unsigned int) > 2 * PyLong_SHIFT) { + if (8 * sizeof(size_t) > 2 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) >= 3 * PyLong_SHIFT) { - return (unsigned int) (((((((unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0])); + __PYX_VERIFY_RETURN_INT(size_t, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) >= 3 * PyLong_SHIFT) { + return (size_t) (((((((size_t)digits[2]) << PyLong_SHIFT) | (size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0])); } } break; case 4: - if (8 * sizeof(unsigned int) > 3 * PyLong_SHIFT) { + if (8 * sizeof(size_t) > 3 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) >= 4 * PyLong_SHIFT) { - return (unsigned int) (((((((((unsigned int)digits[3]) << PyLong_SHIFT) | (unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0])); + __PYX_VERIFY_RETURN_INT(size_t, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) >= 4 * PyLong_SHIFT) { + return (size_t) (((((((((size_t)digits[3]) << 
PyLong_SHIFT) | (size_t)digits[2]) << PyLong_SHIFT) | (size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0])); } } break; @@ -8743,86 +8215,86 @@ static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *x) { { int result = PyObject_RichCompareBool(x, Py_False, Py_LT); if (unlikely(result < 0)) - return (unsigned int) -1; + return (size_t) -1; if (unlikely(result == 1)) goto raise_neg_overflow; } #endif - if (sizeof(unsigned int) <= sizeof(unsigned long)) { - __PYX_VERIFY_RETURN_INT_EXC(unsigned int, unsigned long, PyLong_AsUnsignedLong(x)) + if (sizeof(size_t) <= sizeof(unsigned long)) { + __PYX_VERIFY_RETURN_INT_EXC(size_t, unsigned long, PyLong_AsUnsignedLong(x)) #ifdef HAVE_LONG_LONG - } else if (sizeof(unsigned int) <= sizeof(unsigned PY_LONG_LONG)) { - __PYX_VERIFY_RETURN_INT_EXC(unsigned int, unsigned PY_LONG_LONG, PyLong_AsUnsignedLongLong(x)) + } else if (sizeof(size_t) <= sizeof(unsigned PY_LONG_LONG)) { + __PYX_VERIFY_RETURN_INT_EXC(size_t, unsigned PY_LONG_LONG, PyLong_AsUnsignedLongLong(x)) #endif } } else { #if CYTHON_USE_PYLONG_INTERNALS const digit* digits = ((PyLongObject*)x)->ob_digit; switch (Py_SIZE(x)) { - case 0: return (unsigned int) 0; - case -1: __PYX_VERIFY_RETURN_INT(unsigned int, sdigit, (sdigit) (-(sdigit)digits[0])) - case 1: __PYX_VERIFY_RETURN_INT(unsigned int, digit, +digits[0]) + case 0: return (size_t) 0; + case -1: __PYX_VERIFY_RETURN_INT(size_t, sdigit, (sdigit) (-(sdigit)digits[0])) + case 1: __PYX_VERIFY_RETURN_INT(size_t, digit, +digits[0]) case -2: - if (8 * sizeof(unsigned int) - 1 > 1 * PyLong_SHIFT) { + if (8 * sizeof(size_t) - 1 > 1 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, long, -(long) (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) - 1 > 2 * PyLong_SHIFT) { - return (unsigned int) (((unsigned int)-1)*(((((unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned 
int)digits[0]))); + __PYX_VERIFY_RETURN_INT(size_t, long, -(long) (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) - 1 > 2 * PyLong_SHIFT) { + return (size_t) (((size_t)-1)*(((((size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0]))); } } break; case 2: - if (8 * sizeof(unsigned int) > 1 * PyLong_SHIFT) { + if (8 * sizeof(size_t) > 1 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 2 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) - 1 > 2 * PyLong_SHIFT) { - return (unsigned int) ((((((unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + __PYX_VERIFY_RETURN_INT(size_t, unsigned long, (((((unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) - 1 > 2 * PyLong_SHIFT) { + return (size_t) ((((((size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0]))); } } break; case -3: - if (8 * sizeof(unsigned int) - 1 > 2 * PyLong_SHIFT) { + if (8 * sizeof(size_t) - 1 > 2 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, long, -(long) (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) - 1 > 3 * PyLong_SHIFT) { - return (unsigned int) (((unsigned int)-1)*(((((((unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + __PYX_VERIFY_RETURN_INT(size_t, long, -(long) (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) - 1 > 3 * PyLong_SHIFT) { + return (size_t) (((size_t)-1)*(((((((size_t)digits[2]) << PyLong_SHIFT) | (size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0]))); } } break; 
case 3: - if (8 * sizeof(unsigned int) > 2 * PyLong_SHIFT) { + if (8 * sizeof(size_t) > 2 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 3 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) - 1 > 3 * PyLong_SHIFT) { - return (unsigned int) ((((((((unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + __PYX_VERIFY_RETURN_INT(size_t, unsigned long, (((((((unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) - 1 > 3 * PyLong_SHIFT) { + return (size_t) ((((((((size_t)digits[2]) << PyLong_SHIFT) | (size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0]))); } } break; case -4: - if (8 * sizeof(unsigned int) - 1 > 3 * PyLong_SHIFT) { + if (8 * sizeof(size_t) - 1 > 3 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, long, -(long) (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) - 1 > 4 * PyLong_SHIFT) { - return (unsigned int) (((unsigned int)-1)*(((((((((unsigned int)digits[3]) << PyLong_SHIFT) | (unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + __PYX_VERIFY_RETURN_INT(size_t, long, -(long) (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) - 1 > 4 * PyLong_SHIFT) { + return (size_t) (((size_t)-1)*(((((((((size_t)digits[3]) << PyLong_SHIFT) | (size_t)digits[2]) << PyLong_SHIFT) | (size_t)digits[1]) << 
PyLong_SHIFT) | (size_t)digits[0]))); } } break; case 4: - if (8 * sizeof(unsigned int) > 3 * PyLong_SHIFT) { + if (8 * sizeof(size_t) > 3 * PyLong_SHIFT) { if (8 * sizeof(unsigned long) > 4 * PyLong_SHIFT) { - __PYX_VERIFY_RETURN_INT(unsigned int, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) - } else if (8 * sizeof(unsigned int) - 1 > 4 * PyLong_SHIFT) { - return (unsigned int) ((((((((((unsigned int)digits[3]) << PyLong_SHIFT) | (unsigned int)digits[2]) << PyLong_SHIFT) | (unsigned int)digits[1]) << PyLong_SHIFT) | (unsigned int)digits[0]))); + __PYX_VERIFY_RETURN_INT(size_t, unsigned long, (((((((((unsigned long)digits[3]) << PyLong_SHIFT) | (unsigned long)digits[2]) << PyLong_SHIFT) | (unsigned long)digits[1]) << PyLong_SHIFT) | (unsigned long)digits[0]))) + } else if (8 * sizeof(size_t) - 1 > 4 * PyLong_SHIFT) { + return (size_t) ((((((((((size_t)digits[3]) << PyLong_SHIFT) | (size_t)digits[2]) << PyLong_SHIFT) | (size_t)digits[1]) << PyLong_SHIFT) | (size_t)digits[0]))); } } break; } #endif - if (sizeof(unsigned int) <= sizeof(long)) { - __PYX_VERIFY_RETURN_INT_EXC(unsigned int, long, PyLong_AsLong(x)) + if (sizeof(size_t) <= sizeof(long)) { + __PYX_VERIFY_RETURN_INT_EXC(size_t, long, PyLong_AsLong(x)) #ifdef HAVE_LONG_LONG - } else if (sizeof(unsigned int) <= sizeof(PY_LONG_LONG)) { - __PYX_VERIFY_RETURN_INT_EXC(unsigned int, PY_LONG_LONG, PyLong_AsLongLong(x)) + } else if (sizeof(size_t) <= sizeof(PY_LONG_LONG)) { + __PYX_VERIFY_RETURN_INT_EXC(size_t, PY_LONG_LONG, PyLong_AsLongLong(x)) #endif } } @@ -8831,7 +8303,7 @@ static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *x) { PyErr_SetString(PyExc_RuntimeError, "_PyLong_AsByteArray() not available in PyPy, cannot convert large numbers"); #else - unsigned int val; + size_t val; PyObject *v = __Pyx_PyNumber_IntOrLong(x); #if PY_MAJOR_VERSION < 3 if 
(likely(v) && !PyLong_Check(v)) { @@ -8851,24 +8323,24 @@ static CYTHON_INLINE unsigned int __Pyx_PyInt_As_unsigned_int(PyObject *x) { return val; } #endif - return (unsigned int) -1; + return (size_t) -1; } } else { - unsigned int val; + size_t val; PyObject *tmp = __Pyx_PyNumber_IntOrLong(x); - if (!tmp) return (unsigned int) -1; - val = __Pyx_PyInt_As_unsigned_int(tmp); + if (!tmp) return (size_t) -1; + val = __Pyx_PyInt_As_size_t(tmp); Py_DECREF(tmp); return val; } raise_overflow: PyErr_SetString(PyExc_OverflowError, - "value too large to convert to unsigned int"); - return (unsigned int) -1; + "value too large to convert to size_t"); + return (size_t) -1; raise_neg_overflow: PyErr_SetString(PyExc_OverflowError, - "can't convert negative value to unsigned int"); - return (unsigned int) -1; + "can't convert negative value to size_t"); + return (size_t) -1; } /* CIntFromPy */ @@ -9060,6 +8532,37 @@ static CYTHON_INLINE int __Pyx_PyInt_As_int(PyObject *x) { return (int) -1; } +/* CIntToPy */ +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { + const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; + const int is_unsigned = neg_one > const_zero; + if (is_unsigned) { + if (sizeof(long) < sizeof(long)) { + return PyInt_FromLong((long) value); + } else if (sizeof(long) <= sizeof(unsigned long)) { + return PyLong_FromUnsignedLong((unsigned long) value); +#ifdef HAVE_LONG_LONG + } else if (sizeof(long) <= sizeof(unsigned PY_LONG_LONG)) { + return PyLong_FromUnsignedLongLong((unsigned PY_LONG_LONG) value); +#endif + } + } else { + if (sizeof(long) <= sizeof(long)) { + return PyInt_FromLong((long) value); +#ifdef HAVE_LONG_LONG + } else if (sizeof(long) <= sizeof(PY_LONG_LONG)) { + return PyLong_FromLongLong((PY_LONG_LONG) value); +#endif + } + } + { + int one = 1; int little = (int)*(unsigned char *)&one; + unsigned char *bytes = (unsigned char *)&value; + return _PyLong_FromByteArray(bytes, sizeof(long), + little, !is_unsigned); + } 
+} + /* CIntFromPy */ static CYTHON_INLINE long __Pyx_PyInt_As_long(PyObject *x) { const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; diff --git a/gensim/models/_utils_any2vec.pyx b/gensim/models/_utils_any2vec.pyx index f27d7e400f..cc4ba9bbb4 100644 --- a/gensim/models/_utils_any2vec.pyx +++ b/gensim/models/_utils_any2vec.pyx @@ -7,29 +7,27 @@ """General functions used for any2vec models.""" +# +# This is here to support older versions of the MSVC compiler that don't have stdint.h. +# +cdef extern from "stdint_wrapper.h": + ctypedef unsigned int uint32_t + ctypedef signed char int8_t + from six import PY2 import numpy as np cimport numpy as np -cdef _byte_to_int_py3(b): - return b - -cdef _byte_to_int_py2(b): - return ord(b) - -_byte_to_int = _byte_to_int_py2 if PY2 else _byte_to_int_py3 - - -cpdef ft_hash(unicode string): - """Calculate hash based on `string`. +cpdef ft_hash_bytes(bytes bytez): + """Calculate hash based on `bytez`. Reproduce `hash method from Facebook fastText implementation `_. Parameters ---------- - string : unicode - The string whose hash needs to be calculated. + bytez : bytes + The string whose hash needs to be calculated, encoded as UTF-8. Returns ------- @@ -37,10 +35,12 @@ cpdef ft_hash(unicode string): The hash of the string. """ - cdef unsigned int h = 2166136261 - for c in string.encode("utf-8"): - h = np.uint32(h ^ np.uint32(np.int8(_byte_to_int(c)))) - h = np.uint32(h * np.uint32(16777619)) + cdef uint32_t h = 2166136261 + cdef char b + + for b in bytez: + h = h ^ (b) + h = h * 16777619 return h @@ -92,3 +92,56 @@ cpdef compute_ngrams(word, unsigned int min_n, unsigned int max_n): for i in range(0, len(extended_word) - ngram_length + 1): ngrams.append(extended_word[i:i + ngram_length]) return ngrams + +# +# UTF-8 bytes that begin with 10 are subsequent bytes of a multi-byte sequence, +# as opposed to a new character. 
+# +cdef unsigned char _MB_MASK = 0xC0 +cdef unsigned char _MB_START = 0x80 + + +cpdef compute_ngrams_bytes(word, unsigned int min_n, unsigned int max_n): + """Computes ngrams for a word. + + Ported from the original FB implementation. + + Parameters + ---------- + word : str + A unicode string. + min_n : unsigned int + The minimum ngram length. + max_n : unsigned int + The maximum ngram length. + + Returns: + -------- + list of str + A list of ngrams, where each ngram is a list of **bytes**. + + See Also + -------- + `Original implementation `__ + + """ + cdef bytes utf8_word = ('<%s>' % word).encode("utf-8") + cdef const unsigned char *bytez = utf8_word + cdef size_t num_bytes = len(utf8_word) + cdef size_t j, i, n + + ngrams = [] + for i in range(num_bytes): + if bytez[i] & _MB_MASK == _MB_START: + continue + + j, n = i, 1 + while j < num_bytes and n <= max_n: + j += 1 + while j < num_bytes and (bytez[j] & _MB_MASK) == _MB_START: + j += 1 + if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): + ngram = bytes(bytez[i:j]) + ngrams.append(ngram) + n += 1 + return ngrams diff --git a/gensim/models/deprecated/fasttext.py b/gensim/models/deprecated/fasttext.py index 836c66d4ca..81e01a5069 100644 --- a/gensim/models/deprecated/fasttext.py +++ b/gensim/models/deprecated/fasttext.py @@ -601,9 +601,9 @@ def train(self, sentences, total_examples=None, total_words=None, """ self.neg_labels = [] if self.negative > 0: - # precompute negative labels optimization for pure-python training - self.neg_labels = zeros(self.negative + 1) - self.neg_labels[0] = 1. + # precompute negative labels optimization for pure-python training + self.neg_labels = zeros(self.negative + 1) + self.neg_labels[0] = 1. 
Word2Vec.train( self, sentences, total_examples=self.corpus_count, epochs=self.iter, diff --git a/gensim/models/doc2vec.py b/gensim/models/doc2vec.py index 46508afdb3..9812dc5ef4 100644 --- a/gensim/models/doc2vec.py +++ b/gensim/models/doc2vec.py @@ -907,6 +907,9 @@ def infer_vector(self, doc_words, alpha=None, min_alpha=None, epochs=None, steps The inferred paragraph vector for the new document. """ + if isinstance(doc_words, string_types): + raise TypeError("Parameter doc_words of infer_vector() must be a list of strings (not a single string).") + alpha = alpha or self.alpha min_alpha = min_alpha or self.min_alpha epochs = epochs or steps or self.epochs diff --git a/gensim/models/doc2vec_corpusfile.cpp b/gensim/models/doc2vec_corpusfile.cpp index eb2afa5f98..e9f809730c 100644 --- a/gensim/models/doc2vec_corpusfile.cpp +++ b/gensim/models/doc2vec_corpusfile.cpp @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. 
#else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -412,7 +412,7 @@ class __Pyx_FakeReference { typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -435,7 +435,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? PyDict_New() : _PyDict_NewPresized(n)) #else @@ -883,7 +883,7 @@ static const char *__pyx_f[] = { #endif -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. 
* * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -892,7 +892,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -901,7 +901,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -910,7 +910,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -919,7 +919,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 uint8_t # <<<<<<<<<<<<<< @@ -928,7 +928,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t 
* ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -937,7 +937,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -946,7 +946,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -955,7 +955,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -964,7 +964,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 * * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -973,7 +973,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 +/* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -982,7 +982,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -991,7 +991,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -1000,7 +1000,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -1009,7 +1009,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -1018,7 +1018,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef 
npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -1027,7 +1027,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1036,7 +1036,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1045,7 +1045,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1054,7 +1054,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef npy_double __pyx_t_5numpy_float_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1063,7 +1063,7 @@ typedef 
npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1118,7 +1118,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonLineSentence; struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonVocab; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1127,7 +1127,7 @@ struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonVocab; */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1136,7 +1136,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1145,7 +1145,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -5886,7 +5886,7 @@ static PyObject *__pyx_pf_6gensim_6models_18doc2vec_corpusfile_4d2v_train_epoch_ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -5935,7 +5935,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -5944,7 +5944,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -5953,7 +5953,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -5962,7 +5962,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -5976,7 +5976,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -5987,7 +5987,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -5996,7 +5996,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + 
/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -6009,7 +6009,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6018,7 +6018,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6032,7 +6032,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -6043,7 +6043,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6052,7 +6052,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -6065,7 +6065,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6074,7 +6074,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -6083,7 +6083,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -6092,7 +6092,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6102,7 +6102,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -6111,7 +6111,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -6120,7 +6120,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -6132,7 +6132,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -6141,7 +6141,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -6151,7 +6151,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6161,7 +6161,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -6171,7 +6171,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -6182,7 +6182,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -6191,7 +6191,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * 
info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -6200,7 +6200,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -6209,7 +6209,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< @@ -6218,7 +6218,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_f = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< @@ -6231,7 +6231,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -6244,7 +6244,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); 
__pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -6254,7 +6254,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -6264,7 +6264,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6284,7 +6284,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -6301,7 +6301,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6310,7 +6310,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -6323,7 +6323,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6332,7 +6332,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -6345,7 +6345,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UBYTE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< @@ -6356,7 +6356,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_SHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< @@ -6367,7 +6367,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_USHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< @@ -6378,7 +6378,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_INT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< @@ -6389,7 +6389,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UINT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< @@ -6400,7 +6400,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< @@ -6411,7 +6411,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< @@ -6422,7 +6422,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< @@ -6433,7 +6433,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< 
@@ -6444,7 +6444,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_FLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< @@ -6455,7 +6455,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_DOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< @@ -6466,7 +6466,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< @@ -6477,7 +6477,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CFLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< @@ -6488,7 +6488,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CDOUBLE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< @@ -6499,7 +6499,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CLONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< @@ -6510,7 +6510,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_OBJECT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< @@ -6521,7 +6521,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; default: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -6542,7 +6542,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -6551,7 +6551,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -6561,7 +6561,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -6570,7 +6570,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -6580,7 +6580,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment 
# <<<<<<<<<<<<<< @@ -6589,7 +6589,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -6598,7 +6598,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< @@ -6608,7 +6608,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) __pyx_v_f = __pyx_t_9; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -6618,7 +6618,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * 
# experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -6650,7 +6650,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -6674,7 +6674,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -6684,7 +6684,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -6693,7 +6693,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def 
__releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -6702,7 +6702,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6712,7 +6712,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -6721,7 +6721,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6730,7 +6730,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -6742,7 +6742,7 @@ static void 
__pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -6756,7 +6756,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -6770,7 +6770,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -6789,7 +6789,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -6803,7 +6803,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -6817,7 +6817,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -6836,7 +6836,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -6850,7 +6850,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -6864,7 +6864,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -6883,7 +6883,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -6897,7 +6897,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -6911,7 +6911,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -6930,7 +6930,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, 
c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -6944,7 +6944,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -6958,7 +6958,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -6977,7 +6977,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -6991,7 +6991,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ 
-7001,7 +7001,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -7013,7 +7013,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -7022,7 +7022,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -7036,7 +7036,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -7051,7 +7051,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -7080,7 +7080,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -7089,7 +7089,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -7098,7 +7098,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -7121,7 +7121,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -7138,7 +7138,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -7173,7 +7173,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -7190,7 +7190,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -7203,7 +7203,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 856, __pyx_L1_error) - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -7212,7 +7212,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7232,7 +7232,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -7249,7 +7249,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7258,7 +7258,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -7271,7 +7271,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 860, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7280,7 +7280,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -7296,7 +7296,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -7305,7 +7305,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -7314,7 +7314,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -7325,7 +7325,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -7335,7 +7335,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -7345,7 +7345,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = 
child.type_num # <<<<<<<<<<<<<< @@ -7357,7 +7357,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -7367,7 +7367,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -7380,7 +7380,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __PYX_ERR(1, 880, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -7389,7 +7389,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< @@ -7407,7 +7407,7 @@ static CYTHON_INLINE char 
*__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< @@ -7425,7 +7425,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< @@ -7443,7 +7443,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< @@ -7461,7 +7461,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< @@ -7479,7 +7479,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< @@ -7497,7 +7497,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< @@ -7515,7 +7515,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< @@ -7533,7 +7533,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< @@ -7551,7 +7551,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< @@ -7569,7 +7569,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< @@ -7587,7 +7587,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< @@ -7605,7 +7605,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< @@ -7623,7 +7623,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == 
NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< @@ -7643,7 +7643,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< @@ -7663,7 +7663,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< @@ -7683,7 +7683,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< @@ -7701,7 +7701,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -7720,7 +7720,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L15:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -7729,7 +7729,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -7739,7 +7739,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -7752,7 +7752,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L13:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -7762,7 +7762,7 @@ static 
CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -7772,7 +7772,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -7797,7 +7797,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -7809,7 +7809,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 * * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! 
# <<<<<<<<<<<<<< @@ -7818,7 +7818,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ Py_INCREF(__pyx_v_base); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< @@ -7827,7 +7827,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -7839,7 +7839,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -7854,7 +7854,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< @@ -7863,7 +7863,7 @@ static 
CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -7873,7 +7873,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_t_1 = ((__pyx_v_base == NULL) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 * base = PyArray_BASE(arr) * if base is NULL: * return None # <<<<<<<<<<<<<< @@ -7884,7 +7884,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -7893,7 +7893,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 * if base is NULL: * return None * return base # <<<<<<<<<<<<<< @@ -7905,7 +7905,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = ((PyObject *)__pyx_v_base); goto __pyx_L0; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -7920,7 +7920,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -7941,7 +7941,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -7957,7 +7957,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< @@ -7966,7 +7966,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { */ __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -7980,7 +7980,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -7995,7 +7995,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -8011,7 +8011,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8026,7 +8026,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -8049,7 +8049,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -8070,7 +8070,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8086,7 +8086,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() 
except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -8095,7 +8095,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8109,7 +8109,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -8124,7 +8124,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -8140,7 +8140,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8155,7 +8155,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -8178,7 +8178,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -8199,7 +8199,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8215,7 +8215,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -8224,7 +8224,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8238,7 +8238,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -8252,7 +8252,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -8266,7 +8266,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8281,7 +8281,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -8444,7 +8444,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_RefNannyDeclarations 
__Pyx_RefNannySetupContext("__Pyx_InitCachedConstants", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -8455,7 +8455,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple_); __Pyx_GIVEREF(__pyx_tuple_); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -8466,7 +8466,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__2); __Pyx_GIVEREF(__pyx_tuple__2); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -8477,7 +8477,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__3); __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string 
allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -8488,7 +8488,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__4); __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -8499,7 +8499,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__5); __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -8510,7 +8510,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__6); __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -9116,7 +9116,7 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_test, __pyx_t_7) < 0) __PYX_ERR(0, 1, __pyx_L1_error) __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ 
-10589,7 +10589,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_PY_LONG_LONG(PY_LONG_LONG value) theta = 0; } else { r = -a.real; - theta = atan2f(0, -1); + theta = atan2f(0.0, -1.0); } } else { r = __Pyx_c_abs_float(a); @@ -10744,7 +10744,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_PY_LONG_LONG(PY_LONG_LONG value) theta = 0; } else { r = -a.real; - theta = atan2(0, -1); + theta = atan2(0.0, -1.0); } } else { r = __Pyx_c_abs_double(a); diff --git a/gensim/models/doc2vec_inner.c b/gensim/models/doc2vec_inner.c index 4f72058e4f..f273456a65 100644 --- a/gensim/models/doc2vec_inner.c +++ b/gensim/models/doc2vec_inner.c @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. #else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -398,7 +398,7 @@ typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -421,7 +421,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? 
PyDict_New() : _PyDict_NewPresized(n)) #else @@ -859,7 +859,7 @@ static const char *__pyx_f[] = { #endif -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. * * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -868,7 +868,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -877,7 +877,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -886,7 +886,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -895,7 +895,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 
uint8_t # <<<<<<<<<<<<<< @@ -904,7 +904,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -913,7 +913,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -922,7 +922,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -931,7 +931,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -940,7 +940,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 
* * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -949,7 +949,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -958,7 +958,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -967,7 +967,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -976,7 +976,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -985,7 +985,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -994,7 +994,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -1003,7 +1003,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1012,7 +1012,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1021,7 +1021,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1030,7 +1030,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef 
npy_double __pyx_t_5numpy_float_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1039,7 +1039,7 @@ typedef npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1083,7 +1083,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do /*--- Type declarations ---*/ -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1092,7 +1092,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1101,7 +1101,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef 
npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1110,7 +1110,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -7838,7 +7838,7 @@ static PyObject *__pyx_pf_6gensim_6models_13doc2vec_inner_4train_document_dm_con return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -7887,7 +7887,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -7896,7 +7896,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -7905,7 +7905,7 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -7914,7 +7914,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -7928,7 +7928,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -7939,7 +7939,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -7948,7 +7948,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject 
*__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -7961,7 +7961,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -7970,7 +7970,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -7984,7 +7984,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -7995,7 +7995,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject 
*__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -8004,7 +8004,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -8017,7 +8017,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -8026,7 +8026,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -8035,7 +8035,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject 
*__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -8044,7 +8044,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8054,7 +8054,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -8063,7 +8063,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -8072,7 +8072,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -8084,7 +8084,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -8093,7 +8093,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -8103,7 +8103,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8113,7 +8113,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -8123,7 +8123,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -8134,7 +8134,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -8143,7 +8143,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * 
info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -8152,7 +8152,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -8161,7 +8161,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< @@ -8170,7 +8170,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_f = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< @@ -8183,7 +8183,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -8196,7 +8196,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); 
__pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -8206,7 +8206,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -8216,7 +8216,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8236,7 +8236,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -8253,7 +8253,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8262,7 +8262,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -8275,7 +8275,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8284,7 +8284,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -8297,7 +8297,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UBYTE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< @@ -8308,7 +8308,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_SHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< @@ -8319,7 +8319,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_USHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< @@ -8330,7 +8330,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_INT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< @@ -8341,7 +8341,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UINT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< @@ -8352,7 +8352,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< @@ -8363,7 +8363,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< @@ -8374,7 +8374,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< @@ -8385,7 +8385,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< 
@@ -8396,7 +8396,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_FLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< @@ -8407,7 +8407,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_DOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< @@ -8418,7 +8418,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< @@ -8429,7 +8429,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CFLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< @@ -8440,7 +8440,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CDOUBLE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< @@ -8451,7 +8451,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CLONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< @@ -8462,7 +8462,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_OBJECT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< @@ -8473,7 +8473,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; default: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -8494,7 +8494,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -8503,7 +8503,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -8513,7 +8513,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -8522,7 +8522,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -8532,7 +8532,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment 
# <<<<<<<<<<<<<< @@ -8541,7 +8541,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -8550,7 +8550,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< @@ -8560,7 +8560,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) __pyx_v_f = __pyx_t_9; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -8570,7 +8570,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * 
# experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -8602,7 +8602,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -8626,7 +8626,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -8636,7 +8636,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -8645,7 +8645,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def 
__releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -8654,7 +8654,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8664,7 +8664,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -8673,7 +8673,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8682,7 +8682,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -8694,7 +8694,7 @@ static void 
__pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -8708,7 +8708,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -8722,7 +8722,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -8741,7 +8741,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -8755,7 +8755,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -8769,7 +8769,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -8788,7 +8788,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -8802,7 +8802,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -8816,7 +8816,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -8835,7 +8835,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -8849,7 +8849,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -8863,7 +8863,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -8882,7 +8882,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, 
c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -8896,7 +8896,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -8910,7 +8910,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -8929,7 +8929,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -8943,7 +8943,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ 
-8953,7 +8953,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -8965,7 +8965,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -8974,7 +8974,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -8988,7 +8988,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -9003,7 +9003,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -9032,7 +9032,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -9041,7 +9041,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -9050,7 +9050,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -9073,7 +9073,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -9090,7 +9090,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -9125,7 +9125,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -9142,7 +9142,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -9155,7 +9155,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 856, __pyx_L1_error) - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -9164,7 +9164,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9184,7 +9184,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -9201,7 +9201,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9210,7 +9210,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -9223,7 +9223,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 860, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9232,7 +9232,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -9248,7 +9248,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -9257,7 +9257,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -9266,7 +9266,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -9277,7 +9277,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -9287,7 +9287,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -9297,7 +9297,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = 
child.type_num # <<<<<<<<<<<<<< @@ -9309,7 +9309,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -9319,7 +9319,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -9332,7 +9332,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __PYX_ERR(1, 880, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -9341,7 +9341,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< @@ -9359,7 +9359,7 @@ static CYTHON_INLINE char 
*__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< @@ -9377,7 +9377,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< @@ -9395,7 +9395,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< @@ -9413,7 +9413,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< @@ -9431,7 +9431,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< @@ -9449,7 +9449,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< @@ -9467,7 +9467,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< @@ -9485,7 +9485,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< @@ -9503,7 +9503,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< @@ -9521,7 +9521,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< @@ -9539,7 +9539,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< @@ -9557,7 +9557,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< @@ -9575,7 +9575,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == 
NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< @@ -9595,7 +9595,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< @@ -9615,7 +9615,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< @@ -9635,7 +9635,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< @@ -9653,7 +9653,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -9672,7 +9672,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L15:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -9681,7 +9681,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -9691,7 +9691,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -9704,7 +9704,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L13:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -9714,7 +9714,7 @@ static 
CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -9724,7 +9724,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -9749,7 +9749,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -9761,7 +9761,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 * * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! 
# <<<<<<<<<<<<<< @@ -9770,7 +9770,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ Py_INCREF(__pyx_v_base); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< @@ -9779,7 +9779,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -9791,7 +9791,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -9806,7 +9806,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< @@ -9815,7 +9815,7 @@ static 
CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -9825,7 +9825,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_t_1 = ((__pyx_v_base == NULL) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 * base = PyArray_BASE(arr) * if base is NULL: * return None # <<<<<<<<<<<<<< @@ -9836,7 +9836,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -9845,7 +9845,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 * if base is NULL: * return None * return base # <<<<<<<<<<<<<< @@ -9857,7 +9857,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = ((PyObject *)__pyx_v_base); goto __pyx_L0; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -9872,7 +9872,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -9893,7 +9893,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -9909,7 +9909,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< @@ -9918,7 +9918,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { */ __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -9932,7 +9932,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -9947,7 +9947,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -9963,7 +9963,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -9978,7 +9978,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -10001,7 +10001,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -10022,7 +10022,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -10038,7 +10038,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() 
except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -10047,7 +10047,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -10061,7 +10061,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -10076,7 +10076,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -10092,7 +10092,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -10107,7 +10107,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -10130,7 +10130,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -10151,7 +10151,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -10167,7 +10167,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -10176,7 +10176,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -10190,7 +10190,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -10204,7 +10204,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -10218,7 +10218,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -10233,7 +10233,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -10417,7 +10417,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { 
__Pyx_GOTREF(__pyx_tuple__2); __Pyx_GIVEREF(__pyx_tuple__2); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -10428,7 +10428,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__3); __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -10439,7 +10439,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__4); __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -10450,7 +10450,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__5); __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise 
RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -10461,7 +10461,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__6); __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -10472,7 +10472,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__7); __Pyx_GIVEREF(__pyx_tuple__7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -10483,7 +10483,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__8); __Pyx_GIVEREF(__pyx_tuple__8); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -10969,8 +10969,8 @@ if (!__Pyx_RefNanny) { __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; goto __pyx_L7_try_end; __pyx_L2_error:; - __Pyx_XDECREF(__pyx_t_2); __pyx_t_2 = 0; __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; + __Pyx_XDECREF(__pyx_t_2); __pyx_t_2 = 0; /* "gensim/models/doc2vec_inner.pyx":23 * try: @@ -11096,7 +11096,7 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_test, __pyx_t_7) < 0) __PYX_ERR(0, 1, __pyx_L1_error) __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - 
/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -12754,7 +12754,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_PY_LONG_LONG(unsigned P theta = 0; } else { r = -a.real; - theta = atan2f(0, -1); + theta = atan2f(0.0, -1.0); } } else { r = __Pyx_c_abs_float(a); @@ -12909,7 +12909,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_PY_LONG_LONG(unsigned P theta = 0; } else { r = -a.real; - theta = atan2(0, -1); + theta = atan2(0.0, -1.0); } } else { r = __Pyx_c_abs_double(a); diff --git a/gensim/models/fasttext.py b/gensim/models/fasttext.py index 1b03268442..7fd1db6dbc 100644 --- a/gensim/models/fasttext.py +++ b/gensim/models/fasttext.py @@ -14,6 +14,9 @@ This module contains a fast native C implementation of Fasttext with Python interfaces. It is **not** only a wrapper around Facebook's implementation. +This module supports loading models trained with Facebook's fastText implementation. +It also supports continuing training from such models. + For a tutorial see `this notebook `_. @@ -27,10 +30,96 @@ .. sourcecode:: pycon - >>> from gensim.test.utils import common_texts - >>> from gensim.models import FastText + >>> # from gensim.models import FastText # FIXME: why does Sphinx dislike this import? 
+ >>> from gensim.test.utils import common_texts # some example sentences + >>> + >>> print(common_texts[0]) + ['human', 'interface', 'computer'] + >>> print(len(common_texts)) + 9 + >>> model = FastText(size=4, window=3, min_count=1) # instantiate + >>> model.build_vocab(sentences=common_texts) + >>> model.train(sentences=common_texts, total_examples=len(common_texts), epochs=10) # train + +Once you have a model, you can access its keyed vectors via the `model.wv` attributes. +The keyed vectors instance is quite powerful: it can perform a wide range of NLP tasks. +For a full list of examples, see :class:`~gensim.models.keyedvectors.FastTextKeyedVectors`. + +You can also pass all the above parameters to the constructor to do everything +in a single line: + +.. sourcecode:: pycon + + >>> model2 = FastText(size=4, window=3, min_count=1, sentences=common_texts, iter=10) + +.. Important:: + This style of initialize-and-train in a single line is **deprecated**. We include it here + for backward compatibility only. + + Please use the initialize-`build_vocab`-`train` pattern above instead, including using `epochs` + instead of `iter`. + The motivation is to simplify the API and resolve naming inconsistencies, + e.g. the iter parameter to the constructor is called epochs in the train function. + +The two models above are instantiated differently, but behave identically. +For example, we can compare the embeddings they've calculated for the word "computer": + +.. sourcecode:: pycon + + >>> import numpy as np + >>> + >>> np.allclose(model.wv['computer'], model2.wv['computer']) + True + + +In the above examples, we trained the model from sentences (lists of words) loaded into memory. +This is OK for smaller datasets, but for larger datasets, we recommend streaming the file, +for example from disk or the network. +In Gensim, we refer to such datasets as "corpora" (singular "corpus"), and keep them +in the format described in :class:`~gensim.models.word2vec.LineSentence`. 
+Passing a corpus is simple: + +.. sourcecode:: pycon + + >>> from gensim.test.utils import datapath >>> - >>> model = FastText(common_texts, size=4, window=3, min_count=1, iter=10) + >>> corpus_file = datapath('lee_background.cor') # absolute path to corpus + >>> model3 = FastText(size=4, window=3, min_count=1) + >>> model3.build_vocab(corpus_file=corpus_file) # scan over corpus to build the vocabulary + >>> + >>> total_words = model3.corpus_total_words # number of words in the corpus + >>> model3.train(corpus_file=corpus_file, total_words=total_words, epochs=5) + +The model needs the `total_words` parameter in order to +manage the training rate (alpha) correctly, and to give accurate progress estimates. +The above example relies on an implementation detail: the +:meth:`~gensim.models.fasttext.FastText.build_vocab` method +sets the `corpus_total_words` (and also `corpus_count`) model attributes. +You may calculate them by scanning over the corpus yourself, too. + +If you have a corpus in a different format, then you can use it by wrapping it +in an `iterator `_. +Your iterator should yield a list of strings each time, where each string should be a separate word. +Gensim will take care of the rest: + +.. sourcecode:: pycon + + >>> from gensim.utils import tokenize + >>> import smart_open + >>> + >>> + >>> class MyIter(object): + ... def __iter__(self): + ... path = datapath('crime-and-punishment.txt') + ... with smart_open.smart_open(path, 'r', encoding='utf-8') as fin: + ... for line in fin: + ... yield list(tokenize(line)) + >>> + >>> + >>> model4 = FastText(size=4, window=3, min_count=1) + >>> model4.build_vocab(sentences=MyIter()) + >>> total_examples = model4.corpus_count + >>> model4.train(sentences=MyIter(), total_examples=total_examples, epochs=5) Persist a model to disk with: @@ -41,7 +130,67 @@ >>> fname = get_tmpfile("fasttext.model") >>> >>> model.save(fname) - >>> model = FastText.load(fname) # you can continue training with the loaded model! 
+ >>> model = FastText.load(fname) + +Once loaded, such models behave identically to those created from scratch. +For example, you can continue training the loaded model: + +.. sourcecode:: pycon + + >>> import numpy as np + >>> + >>> 'computation' in model.wv.vocab # New word, currently out of vocab + False + >>> old_vector = np.copy(model.wv['computation']) # Grab the existing vector + >>> new_sentences = [ + ... ['computer', 'aided', 'design'], + ... ['computer', 'science'], + ... ['computational', 'complexity'], + ... ['military', 'supercomputer'], + ... ['central', 'processing', 'unit'], + ... ['onboard', 'car', 'computer'], + ... ] + >>> + >>> model.build_vocab(new_sentences, update=True) # Update the vocabulary + >>> model.train(new_sentences, total_examples=len(new_sentences), epochs=model.epochs) + >>> + >>> new_vector = model.wv['computation'] + >>> np.allclose(old_vector, new_vector, atol=1e-4) # Vector has changed, model has learnt something + False + >>> 'computation' in model.wv.vocab # Word is still out of vocab + False + +.. Important:: + Be sure to call the :meth:`~gensim.models.fasttext.FastText.build_vocab` + method with `update=True` before the :meth:`~gensim.models.fasttext.FastText.train` method + when continuing training. Without this call, previously unseen terms + will not be added to the vocabulary. + +You can also load models trained with Facebook's fastText implementation: + +.. sourcecode:: pycon + + >>> cap_path = datapath("crime-and-punishment.bin") + >>> # Partial model: loads quickly, uses less RAM, but cannot continue training + >>> fb_partial = FastText.load_fasttext_format(cap_path, full_model=False) + >>> # Full model: loads slowly, consumes RAM, but can continue training (see below) + >>> fb_full = FastText.load_fasttext_format(cap_path, full_model=True) + +Once loaded, such models behave identically to those trained from scratch. +You may continue training them on new data: + +.. 
sourcecode:: pycon + + >>> 'computer' in fb_full.wv.vocab # New word, currently out of vocab + False + >>> old_computer = np.copy(fb_full.wv['computer']) # Calculate current vectors + >>> fb_full.build_vocab(new_sentences, update=True) + >>> fb_full.train(new_sentences, total_examples=len(new_sentences), epochs=model.epochs) + >>> new_computer = fb_full.wv['computer'] + >>> np.allclose(old_computer, new_computer, atol=1e-4) # Vector has changed, model has learnt something + False + >>> 'computer' in fb_full.wv.vocab # New word is now in the vocabulary + True Retrieve word-vector for vocab and out-of-vocab word: @@ -85,6 +234,33 @@ >>> analogies_result = model.wv.evaluate_word_analogies(datapath('questions-words.txt')) +Implementation Notes +-------------------- + +These notes may help developers navigate our fastText implementation. +The implementation is split across several submodules: + +- :mod:`gensim.models.fasttext`: This module. Contains FastText-specific functionality only. +- :mod:`gensim.models.keyedvectors`: Implements both generic and FastText-specific functionality. +- :mod:`gensim.models.word2vec`: Contains implementations for the vocabulary + and the trainables for FastText. +- :mod:`gensim.models.base_any2vec`: Contains implementations for the base. + classes, including functionality such as callbacks, logging. +- :mod:`gensim.models.utils_any2vec`: Wrapper over Cython extensions. +- :mod:`gensim.utils`: Implements model I/O (loading and saving). + +Our implementation relies heavily on inheritance. +It consists of several important classes: + +- :class:`~gensim.models.word2vec.Word2VecVocab`: the vocabulary. + Keeps track of all the unique words, sometimes discarding the extremely rare ones. + This is sometimes called the Dictionary within Gensim. +- :class:`~gensim.models.keyedvectors.FastTextKeyedVectors`: the vectors. + Once training is complete, this class is sufficient for calculating embeddings. 
+- :class:`~gensim.models.fasttext.FastTextTrainables`: the underlying neural network. + The implementation uses this class to *learn* the word embeddings. +- :class:`~gensim.models.fasttext.FastText`: ties everything together. + """ import logging @@ -98,7 +274,7 @@ from gensim.models.word2vec import Word2VecVocab, Word2VecTrainables, train_sg_pair, train_cbow_pair from gensim.models.keyedvectors import FastTextKeyedVectors from gensim.models.base_any2vec import BaseWordEmbeddingsModel -from gensim.models.utils_any2vec import _compute_ngrams, _ft_hash, _ft_hash_broken +from gensim.models.utils_any2vec import ft_ngram_hashes from smart_open import smart_open from gensim.utils import deprecated, call_on_class_only @@ -235,9 +411,6 @@ def train_epoch_cbow(model, corpus_file, offset, _cython_vocab, _cur_epoch, _exp raise RuntimeError("Training with corpus_file argument is not supported") -FASTTEXT_FILEFORMAT_MAGIC = 793712314 - - class FastText(BaseWordEmbeddingsModel): """Train, use and evaluate word representations learned using the method described in `Enriching Word Vectors with Subword Information `_, aka FastText. @@ -246,8 +419,6 @@ class FastText(BaseWordEmbeddingsModel): :meth:`~gensim.models.fasttext.FastText.load` methods, or loaded from a format compatible with the original Fasttext implementation via :meth:`~gensim.models.fasttext.FastText.load_fasttext_format`. - Some important internal attributes are the following: - Attributes ---------- wv : :class:`~gensim.models.keyedvectors.FastTextKeyedVectors` @@ -535,7 +706,7 @@ def build_vocab(self, sentences=None, corpus_file=None, update=False, progress_p def _set_train_params(self, **kwargs): # # We need the wv.buckets_word member to be initialized in order to - # continue training. The _clear_post_train method destroys this + # continue training. The _clear_post_train method destroys this # variable, so we reinitialize it here, if needed. 
# # The .old_vocab_len and .old_hash2index_len members are set only to @@ -554,8 +725,6 @@ def _clear_post_train(self): self.wv.buckets_word = None def estimate_memory(self, vocab_size=None, report=None): - hash_fn = _ft_hash if self.wv.compatible_hash else _ft_hash_broken - vocab_size = vocab_size or len(self.wv.vocab) vec_size = self.vector_size * np.dtype(np.float32).itemsize l1_size = self.trainables.layer1_size * np.dtype(np.float32).itemsize @@ -574,9 +743,15 @@ def estimate_memory(self, vocab_size=None, report=None): buckets = set() num_ngrams = 0 for word in self.wv.vocab: - ngrams = _compute_ngrams(word, self.wv.min_n, self.wv.max_n) - num_ngrams += len(ngrams) - buckets.update(hash_fn(ng) % self.trainables.bucket for ng in ngrams) + hashes = ft_ngram_hashes( + word, + self.wv.min_n, + self.wv.max_n, + self.trainables.bucket, + self.wv.compatible_hash + ) + num_ngrams += len(hashes) + buckets.update(hashes) num_buckets = len(buckets) report['syn0_ngrams'] = num_buckets * vec_size # A tuple (48 bytes) with num_ngrams_word ints (8 bytes) for each word @@ -704,6 +879,14 @@ def train(self, sentences=None, corpus_file=None, total_examples=None, total_wor >>> model.train(sentences, total_examples=model.corpus_count, epochs=model.epochs) """ + cant_train = hasattr(self.trainables, 'syn1neg') and self.trainables.syn1neg is None + if cant_train: + raise ValueError( + 'this model cannot be trained any further, ' + 'if this is a native model, try loading it with ' + 'FastText.load_fasttext_format(path, full_model=True)' + ) + super(FastText, self).train( sentences=sentences, corpus_file=corpus_file, total_examples=total_examples, total_words=total_words, epochs=epochs, start_alpha=start_alpha, end_alpha=end_alpha, word_count=word_count, @@ -754,12 +937,22 @@ def __contains__(self, word): return self.wv.__contains__(word) @classmethod - def load_fasttext_format(cls, model_file, encoding='utf8'): + def load_fasttext_format(cls, model_file, encoding='utf8', 
full_model=True): """Load the input-hidden weight matrix from Facebook's native fasttext `.bin` and `.vec` output files. + By default, this function loads the full model. A full model allows + continuing training with more data, but also consumes more RAM and + takes longer to load. If you do not need to continue training and only + wish to work with the already-trained embeddings, use `full_model=False` + for faster loading and to save RAM. + Notes ------ - Due to limitations in the FastText API, you cannot continue training with a model loaded this way. + Facebook provides both `.vec` and `.bin` files with their models. + The former contains human-readable vectors. + The latter contains machine-readable vectors along with other model parameters. + This function effectively ignores the `.vec` output file, since that file is redundant. + It only needs the `.bin` file. Parameters ---------- @@ -770,14 +963,55 @@ def load_fasttext_format(cls, model_file, encoding='utf8'): as Gensim requires only `.bin` file to the load entire fastText model. encoding : str, optional Specifies the file encoding. + full_model : boolean, optional + If False, skips loading the hidden output matrix. This saves a fair bit + of CPU time and RAM, but **prevents training continuation**. + + Examples + -------- + + Load, infer, continue training: + + ..
sourcecode:: pycon + + >>> from gensim.test.utils import datapath + >>> + >>> cap_path = datapath("crime-and-punishment.bin") + >>> fb_full = FastText.load_fasttext_format(cap_path, full_model=True) + >>> + >>> 'landlord' in fb_full.wv.vocab # Word is out of vocabulary + False + >>> oov_term = fb_full.wv['landlord'] + >>> + >>> 'landlady' in fb_full.wv.vocab # Word is in the vocabulary + True + >>> iv_term = fb_full.wv['landlady'] + >>> + >>> new_sent = [['lord', 'of', 'the', 'rings'], ['lord', 'of', 'the', 'flies']] + >>> fb_full.build_vocab(new_sent, update=True) + >>> fb_full.train(sentences=new_sent, total_examples=len(new_sent), epochs=5) + + Load quickly, infer (forego training continuation): + + .. sourcecode:: pycon + + >>> fb_partial = FastText.load_fasttext_format(cap_path, full_model=False) + >>> + >>> 'landlord' in fb_partial.wv.vocab # Word is out of vocabulary + False + >>> oov_term = fb_partial.wv['landlord'] + >>> + >>> 'landlady' in fb_partial.wv.vocab # Word is in the vocabulary + True + >>> iv_term = fb_partial.wv['landlady'] Returns ------- - :class: `~gensim.models.fasttext.FastText` + gensim.models.fasttext.FastText The loaded model. """ - return _load_fasttext_format(model_file, encoding=encoding) + return _load_fasttext_format(model_file, encoding=encoding, full_model=full_model) def load_binary_data(self, encoding='utf8'): """Load data from a binary file created by Facebook's native FastText. @@ -841,7 +1075,7 @@ def load(cls, *args, **kwargs): if not hasattr(model.wv, 'compatible_hash'): logger.warning( - "This older model was trained with a buggy hash function. " + "This older model was trained with a buggy hash function. " "The model will continue to work, but consider training it " "from scratch." ) @@ -862,15 +1096,42 @@ def accuracy(self, questions, restrict_vocab=30000, most_similar=None, case_inse return self.wv.accuracy(questions, restrict_vocab, most_similar, case_insensitive) -# -# Keep for backward compatibility. 
-# class FastTextVocab(Word2VecVocab): + """This is a redundant class. It exists only to maintain backwards compatibility + with older gensim versions.""" pass class FastTextTrainables(Word2VecTrainables): - """Represents the inner shallow neural network used to train :class:`~gensim.models.fasttext.FastText`.""" + """Represents the inner shallow neural network used to train :class:`~gensim.models.fasttext.FastText`. + + Mostly inherits from its parent (:class:`~gensim.models.word2vec.Word2VecTrainables`). + Adds logic for calculating and maintaining ngram weights. + + Attributes + ---------- + hashfxn : function + Used for randomly initializing weights. Defaults to the built-in hash(). + layer1_size : int + The size of the inner layer of the NN. Equal to the vector dimensionality. + Set in the :class:`~gensim.models.word2vec.Word2VecTrainables` constructor. + seed : float + The random generator seed used in reset_weights and update_weights. + syn1 : numpy.array + The inner layer of the NN. Each row corresponds to a term in the vocabulary. + Columns correspond to weights of the inner layer. + There are layer1_size such weights. + Set in the reset_weights and update_weights methods, only if hierarchical softmax is used. + syn1neg : numpy.array + Similar to syn1, but only set if negative sampling is used. + vectors_lockf : numpy.array + A one-dimensional array with one element for each term in the vocab. Set in reset_weights to an array of ones. + vectors_vocab_lockf : numpy.array + Similar to vectors_lockf, ones(len(model.trainables.vectors), dtype=REAL) + vectors_ngrams_lockf : numpy.array + np.ones((self.bucket, wv.vector_size), dtype=REAL) + + """ def __init__(self, vector_size=100, seed=1, hashfxn=hash, bucket=2000000): super(FastTextTrainables, self).__init__( vector_size=vector_size, seed=seed, hashfxn=hashfxn) @@ -884,17 +1145,17 @@ def __init__(self, vector_size=100, seed=1, hashfxn=hash, bucket=2000000): # 2.
vectors_ngrams_lockf # # These are both 2D matrices of shapes equal to the shapes of - # wv.vectors_vocab and wv.vectors_ngrams. So, each row corresponds to + # wv.vectors_vocab and wv.vectors_ngrams. So, each row corresponds to # a vector, and each column corresponds to a dimension within that # vector. # # Lockf stands for "lock factor": zero values suppress learning, one - # values enable it. Interestingly, the vectors_vocab_lockf and + # values enable it. Interestingly, the vectors_vocab_lockf and # vectors_ngrams_lockf seem to be used only by the C code in # fasttext_inner.pyx. # # The word2vec implementation also uses vectors_lockf: in that case, - # it's a 1D array, with a real number for each vector. The FastText + # it's a 1D array, with a real number for each vector. The FastText # implementation inherits this vectors_lockf attribute but doesn't # appear to use it. # @@ -959,7 +1220,7 @@ def _pad_ones(m, new_shape): return vstack([m, suffix]) -def _load_fasttext_format(model_file, encoding='utf-8'): +def _load_fasttext_format(model_file, encoding='utf-8', full_model=True): """Load the input-hidden weight matrix from Facebook's native fasttext `.bin` and `.vec` output files. Parameters @@ -971,16 +1232,20 @@ def _load_fasttext_format(model_file, encoding='utf-8'): as Gensim requires only `.bin` file to the load entire fastText model. encoding : str, optional Specifies the file encoding. + full_model : boolean, optional + If False, skips loading the hidden output matrix. This saves a fair bit + of CPU time and RAM, but prevents training continuation. Returns ------- :class: `~gensim.models.fasttext.FastText` The loaded model. 
+ """ if not model_file.endswith('.bin'): model_file += '.bin' with smart_open(model_file, 'rb') as fin: - m = gensim.models._fasttext_bin.load(fin, encoding=encoding) + m = gensim.models._fasttext_bin.load(fin, encoding=encoding, full_model=full_model) model = FastText( size=m.dim, @@ -999,8 +1264,23 @@ def _load_fasttext_format(model_file, encoding='utf-8'): model.vocabulary.raw_vocab = m.raw_vocab model.vocabulary.nwords = m.nwords model.vocabulary.vocab_size = m.vocab_size - model.vocabulary.prepare_vocab(model.hs, model.negative, model.wv, - update=True, min_count=model.min_count) + + # + # This is here to fix https://github.com/RaRe-Technologies/gensim/pull/2373. + # + # We explicitly set min_count=1 regardless of the model's parameters to + # ignore the trim rule when building the vocabulary. We do this in order + # to support loading native models that were trained with pretrained vectors. + # Such models will contain vectors for _all_ encountered words, not only + # those occurring more frequently than min_count. + # + # Native models trained _without_ pretrained vectors already contain the + # trimmed raw_vocab, so this change does not affect them. + # + model.vocabulary.prepare_vocab( + model.hs, model.negative, model.wv, + update=True, min_count=1, + ) model.num_original_vectors = m.vectors_ngrams.shape[0] diff --git a/gensim/models/fasttext_corpusfile.cpp b/gensim/models/fasttext_corpusfile.cpp index 1b34620bca..6a92571f95 100644 --- a/gensim/models/fasttext_corpusfile.cpp +++ b/gensim/models/fasttext_corpusfile.cpp @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. 
#else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -412,7 +412,7 @@ class __Pyx_FakeReference { typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -435,7 +435,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? PyDict_New() : _PyDict_NewPresized(n)) #else @@ -883,7 +883,7 @@ static const char *__pyx_f[] = { #endif -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. 
* * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -892,7 +892,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -901,7 +901,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -910,7 +910,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -919,7 +919,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 uint8_t # <<<<<<<<<<<<<< @@ -928,7 +928,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t 
* ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -937,7 +937,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -946,7 +946,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -955,7 +955,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -964,7 +964,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 * * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -973,7 +973,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 +/* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -982,7 +982,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -991,7 +991,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -1000,7 +1000,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -1009,7 +1009,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -1018,7 +1018,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef 
npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -1027,7 +1027,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1036,7 +1036,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1045,7 +1045,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1054,7 +1054,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef npy_double __pyx_t_5numpy_float_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1063,7 +1063,7 @@ typedef 
npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1127,7 +1127,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonLineSentence; struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonVocab; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1136,7 +1136,7 @@ struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonVocab; */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1145,7 +1145,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1154,7 +1154,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -3967,7 +3967,7 @@ static PyObject *__pyx_pf_6gensim_6models_19fasttext_corpusfile_2train_epoch_cbo return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -4016,7 +4016,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -4025,7 +4025,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -4034,7 +4034,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -4043,7 +4043,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -4057,7 +4057,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -4068,7 +4068,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -4077,7 +4077,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + 
/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -4090,7 +4090,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -4099,7 +4099,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -4113,7 +4113,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -4124,7 +4124,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -4133,7 +4133,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -4146,7 +4146,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -4155,7 +4155,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -4164,7 +4164,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -4173,7 +4173,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -4183,7 +4183,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -4192,7 +4192,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -4201,7 +4201,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -4213,7 +4213,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -4222,7 +4222,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -4232,7 +4232,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -4242,7 +4242,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -4252,7 +4252,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -4263,7 +4263,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -4272,7 +4272,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * 
info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -4281,7 +4281,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -4290,7 +4290,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< @@ -4299,7 +4299,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_f = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< @@ -4312,7 +4312,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -4325,7 +4325,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); 
__pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -4335,7 +4335,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -4345,7 +4345,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -4365,7 +4365,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -4382,7 +4382,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -4391,7 +4391,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -4404,7 +4404,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -4413,7 +4413,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -4426,7 +4426,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UBYTE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< @@ -4437,7 +4437,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_SHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< @@ -4448,7 +4448,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_USHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< @@ -4459,7 +4459,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_INT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< @@ -4470,7 +4470,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UINT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< @@ -4481,7 +4481,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< @@ -4492,7 +4492,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< @@ -4503,7 +4503,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< @@ -4514,7 +4514,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< 
@@ -4525,7 +4525,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_FLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< @@ -4536,7 +4536,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_DOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< @@ -4547,7 +4547,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< @@ -4558,7 +4558,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CFLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< @@ -4569,7 +4569,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CDOUBLE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< @@ -4580,7 +4580,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CLONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< @@ -4591,7 +4591,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_OBJECT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< @@ -4602,7 +4602,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; default: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -4623,7 +4623,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -4632,7 +4632,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -4642,7 +4642,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -4651,7 +4651,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -4661,7 +4661,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment 
# <<<<<<<<<<<<<< @@ -4670,7 +4670,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -4679,7 +4679,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< @@ -4689,7 +4689,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) __pyx_v_f = __pyx_t_9; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -4699,7 +4699,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * 
# experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -4731,7 +4731,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -4755,7 +4755,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -4765,7 +4765,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -4774,7 +4774,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def 
__releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -4783,7 +4783,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -4793,7 +4793,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -4802,7 +4802,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -4811,7 +4811,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -4823,7 +4823,7 @@ static void 
__pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -4837,7 +4837,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -4851,7 +4851,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -4870,7 +4870,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -4884,7 +4884,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -4898,7 +4898,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -4917,7 +4917,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -4931,7 +4931,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -4945,7 +4945,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -4964,7 +4964,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -4978,7 +4978,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -4992,7 +4992,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -5011,7 +5011,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, 
c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -5025,7 +5025,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -5039,7 +5039,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -5058,7 +5058,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -5072,7 +5072,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ 
-5082,7 +5082,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -5094,7 +5094,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -5103,7 +5103,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -5117,7 +5117,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -5132,7 +5132,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -5161,7 +5161,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -5170,7 +5170,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -5179,7 +5179,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -5202,7 +5202,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -5219,7 +5219,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -5254,7 +5254,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -5271,7 +5271,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -5284,7 +5284,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 856, __pyx_L1_error) - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -5293,7 +5293,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -5313,7 +5313,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -5330,7 +5330,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -5339,7 +5339,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -5352,7 +5352,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 860, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -5361,7 +5361,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -5377,7 +5377,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -5386,7 +5386,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -5395,7 +5395,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -5406,7 +5406,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -5416,7 +5416,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -5426,7 +5426,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = 
child.type_num # <<<<<<<<<<<<<< @@ -5438,7 +5438,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -5448,7 +5448,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -5461,7 +5461,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __PYX_ERR(1, 880, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -5470,7 +5470,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< @@ -5488,7 +5488,7 @@ static CYTHON_INLINE char 
*__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< @@ -5506,7 +5506,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< @@ -5524,7 +5524,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< @@ -5542,7 +5542,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< @@ -5560,7 +5560,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< @@ -5578,7 +5578,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< @@ -5596,7 +5596,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< @@ -5614,7 +5614,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< @@ -5632,7 +5632,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< @@ -5650,7 +5650,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< @@ -5668,7 +5668,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< @@ -5686,7 +5686,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< @@ -5704,7 +5704,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == 
NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< @@ -5724,7 +5724,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< @@ -5744,7 +5744,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< @@ -5764,7 +5764,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< @@ -5782,7 +5782,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -5801,7 +5801,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L15:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -5810,7 +5810,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -5820,7 +5820,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -5833,7 +5833,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L13:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -5843,7 +5843,7 @@ static 
CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -5853,7 +5853,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -5878,7 +5878,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -5890,7 +5890,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 * * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! 
# <<<<<<<<<<<<<< @@ -5899,7 +5899,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ Py_INCREF(__pyx_v_base); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< @@ -5908,7 +5908,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -5920,7 +5920,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -5935,7 +5935,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< @@ -5944,7 +5944,7 @@ static 
CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -5954,7 +5954,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_t_1 = ((__pyx_v_base == NULL) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 * base = PyArray_BASE(arr) * if base is NULL: * return None # <<<<<<<<<<<<<< @@ -5965,7 +5965,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -5974,7 +5974,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 * if base is NULL: * return None * return base # <<<<<<<<<<<<<< @@ -5986,7 +5986,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = ((PyObject *)__pyx_v_base); goto __pyx_L0; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -6001,7 +6001,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -6022,7 +6022,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -6038,7 +6038,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< @@ -6047,7 +6047,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { */ __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -6061,7 +6061,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -6076,7 +6076,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -6092,7 +6092,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -6107,7 +6107,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -6130,7 +6130,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -6151,7 +6151,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -6167,7 +6167,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() 
except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -6176,7 +6176,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -6190,7 +6190,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -6205,7 +6205,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -6221,7 +6221,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -6236,7 +6236,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -6259,7 +6259,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -6280,7 +6280,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -6296,7 +6296,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -6305,7 +6305,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -6319,7 +6319,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -6333,7 +6333,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -6347,7 +6347,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -6362,7 +6362,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -6507,7 +6507,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_RefNannyDeclarations 
__Pyx_RefNannySetupContext("__Pyx_InitCachedConstants", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -6518,7 +6518,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple_); __Pyx_GIVEREF(__pyx_tuple_); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -6529,7 +6529,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__2); __Pyx_GIVEREF(__pyx_tuple__2); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -6540,7 +6540,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__3); __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string 
allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -6551,7 +6551,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__4); __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -6562,7 +6562,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__5); __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -6573,7 +6573,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__6); __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -7014,7 +7014,7 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_test, __pyx_t_1) < 0) __PYX_ERR(0, 1, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ 
-8438,7 +8438,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_PY_LONG_LONG(PY_LONG_LONG value) theta = 0; } else { r = -a.real; - theta = atan2f(0, -1); + theta = atan2f(0.0, -1.0); } } else { r = __Pyx_c_abs_float(a); @@ -8593,7 +8593,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_PY_LONG_LONG(PY_LONG_LONG value) theta = 0; } else { r = -a.real; - theta = atan2(0, -1); + theta = atan2(0.0, -1.0); } } else { r = __Pyx_c_abs_double(a); diff --git a/gensim/models/fasttext_inner.c b/gensim/models/fasttext_inner.c index 7f533cd546..36ab7f97b7 100644 --- a/gensim/models/fasttext_inner.c +++ b/gensim/models/fasttext_inner.c @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. #else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -398,7 +398,7 @@ typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -421,7 +421,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? 
PyDict_New() : _PyDict_NewPresized(n)) #else @@ -860,7 +860,7 @@ static const char *__pyx_f[] = { #endif -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. * * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -869,7 +869,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -878,7 +878,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -887,7 +887,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -896,7 +896,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 
uint8_t # <<<<<<<<<<<<<< @@ -905,7 +905,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -914,7 +914,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -923,7 +923,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -932,7 +932,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -941,7 +941,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 
* * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -950,7 +950,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -959,7 +959,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -968,7 +968,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -977,7 +977,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -986,7 +986,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -995,7 +995,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -1004,7 +1004,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1013,7 +1013,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1022,7 +1022,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1031,7 +1031,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef 
npy_double __pyx_t_5numpy_float_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1040,7 +1040,7 @@ typedef npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1084,7 +1084,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do /*--- Type declarations ---*/ -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1093,7 +1093,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1102,7 +1102,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef 
npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1111,7 +1111,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -6560,7 +6560,7 @@ static PyObject *__pyx_pf_6gensim_6models_14fasttext_inner_4init(CYTHON_UNUSED P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -6609,7 +6609,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -6618,7 +6618,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -6627,7 +6627,7 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -6636,7 +6636,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6650,7 +6650,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -6661,7 +6661,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6670,7 +6670,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject 
*__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -6683,7 +6683,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6692,7 +6692,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6706,7 +6706,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< @@ -6717,7 +6717,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject 
*__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6726,7 +6726,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -6739,7 +6739,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< @@ -6748,7 +6748,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -6757,7 +6757,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject 
*__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -6766,7 +6766,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6776,7 +6776,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -6785,7 +6785,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -6794,7 +6794,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -6806,7 +6806,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -6815,7 +6815,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -6825,7 +6825,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -6835,7 +6835,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -6845,7 +6845,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -6856,7 +6856,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -6865,7 +6865,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * 
info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -6874,7 +6874,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -6883,7 +6883,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< @@ -6892,7 +6892,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_f = NULL; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< @@ -6905,7 +6905,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -6918,7 +6918,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); 
__pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -6928,7 +6928,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -6938,7 +6938,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6958,7 +6958,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -6975,7 +6975,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -6984,7 +6984,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -6997,7 +6997,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7006,7 +7006,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -7019,7 +7019,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UBYTE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< @@ -7030,7 +7030,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_SHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< @@ -7041,7 +7041,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_USHORT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< @@ -7052,7 +7052,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_INT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< @@ -7063,7 +7063,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_UINT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< @@ -7074,7 +7074,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< @@ -7085,7 +7085,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< @@ -7096,7 +7096,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< @@ -7107,7 +7107,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_ULONGLONG: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< 
@@ -7118,7 +7118,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_FLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< @@ -7129,7 +7129,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_DOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< @@ -7140,7 +7140,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_LONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< @@ -7151,7 +7151,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CFLOAT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< @@ -7162,7 +7162,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CDOUBLE: - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< @@ -7173,7 +7173,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_CLONGDOUBLE: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< @@ -7184,7 +7184,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; case NPY_OBJECT: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< @@ -7195,7 +7195,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; default: - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -7216,7 +7216,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P break; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -7225,7 +7225,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -7235,7 +7235,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -7244,7 +7244,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -7254,7 +7254,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment 
# <<<<<<<<<<<<<< @@ -7263,7 +7263,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -7272,7 +7272,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< @@ -7282,7 +7282,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) __pyx_v_f = __pyx_t_9; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -7292,7 +7292,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * 
# experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -7324,7 +7324,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -7348,7 +7348,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -7358,7 +7358,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -7367,7 +7367,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def 
__releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -7376,7 +7376,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -7386,7 +7386,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -7395,7 +7395,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -7404,7 +7404,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -7416,7 +7416,7 @@ static void 
__pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -7430,7 +7430,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -7444,7 +7444,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -7463,7 +7463,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -7477,7 +7477,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -7491,7 +7491,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -7510,7 +7510,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -7524,7 +7524,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -7538,7 +7538,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -7557,7 +7557,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -7571,7 +7571,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -7585,7 +7585,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -7604,7 +7604,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, 
c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -7618,7 +7618,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -7632,7 +7632,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ __pyx_t_1 = 0; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -7651,7 +7651,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -7665,7 +7665,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ 
-7675,7 +7675,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -7687,7 +7687,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -7696,7 +7696,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -7710,7 +7710,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -7725,7 +7725,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -7754,7 +7754,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -7763,7 +7763,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -7772,7 +7772,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -7795,7 +7795,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -7812,7 +7812,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -7847,7 +7847,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -7864,7 +7864,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -7877,7 +7877,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 856, __pyx_L1_error) - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -7886,7 +7886,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7906,7 +7906,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -7923,7 +7923,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7932,7 +7932,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -7945,7 +7945,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __PYX_ERR(1, 860, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7954,7 +7954,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -7970,7 +7970,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -7979,7 +7979,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -7988,7 +7988,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -7999,7 +7999,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -8009,7 +8009,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -8019,7 +8019,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = 
child.type_num # <<<<<<<<<<<<<< @@ -8031,7 +8031,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -8041,7 +8041,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -8054,7 +8054,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __PYX_ERR(1, 880, __pyx_L1_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -8063,7 +8063,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< @@ -8081,7 +8081,7 @@ static CYTHON_INLINE char 
*__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< @@ -8099,7 +8099,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< @@ -8117,7 +8117,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< @@ -8135,7 +8135,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< @@ -8153,7 +8153,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< @@ -8171,7 +8171,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< @@ -8189,7 +8189,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< @@ -8207,7 +8207,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< @@ -8225,7 +8225,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< @@ -8243,7 +8243,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< @@ -8261,7 +8261,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< @@ -8279,7 +8279,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< @@ -8297,7 +8297,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == 
NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< @@ -8317,7 +8317,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< @@ -8337,7 +8337,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< @@ -8357,7 +8357,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< @@ -8375,7 +8375,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -8394,7 +8394,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L15:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -8403,7 +8403,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -8413,7 +8413,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -8426,7 +8426,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L13:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -8436,7 +8436,7 @@ static 
CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -8446,7 +8446,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -8471,7 +8471,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -8483,7 +8483,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 * * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! 
# <<<<<<<<<<<<<< @@ -8492,7 +8492,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ Py_INCREF(__pyx_v_base); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 * cdef inline void set_array_base(ndarray arr, object base): * Py_INCREF(base) # important to do this before stealing the reference below! * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< @@ -8501,7 +8501,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a */ (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< @@ -8513,7 +8513,7 @@ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_a __Pyx_RefNannyFinishContext(); } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -8528,7 +8528,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< @@ -8537,7 +8537,7 @@ static 
CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -8547,7 +8547,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_t_1 = ((__pyx_v_base == NULL) != 0); if (__pyx_t_1) { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 * base = PyArray_BASE(arr) * if base is NULL: * return None # <<<<<<<<<<<<<< @@ -8558,7 +8558,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): * base = PyArray_BASE(arr) * if base is NULL: # <<<<<<<<<<<<<< @@ -8567,7 +8567,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py */ } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 * if base is NULL: * return None * return base # <<<<<<<<<<<<<< @@ -8579,7 +8579,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py __pyx_r = ((PyObject *)__pyx_v_base); goto __pyx_L0; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< @@ -8594,7 +8594,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -8615,7 +8615,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8631,7 +8631,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< @@ -8640,7 +8640,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { */ __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8654,7 +8654,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -8669,7 +8669,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -8685,7 +8685,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -8700,7 +8700,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -8723,7 +8723,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -8744,7 +8744,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8760,7 +8760,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() 
except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -8769,7 +8769,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8783,7 +8783,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -8798,7 +8798,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -8814,7 +8814,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -8829,7 +8829,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* 
"../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -8852,7 +8852,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 +/* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -8873,7 +8873,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8889,7 +8889,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< @@ -8898,7 +8898,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { */ __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* 
"../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8912,7 +8912,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -8926,7 +8926,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -8940,7 +8940,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -8955,7 +8955,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -9135,7 +9135,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple_); 
__Pyx_GIVEREF(__pyx_tuple_); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< @@ -9146,7 +9146,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__2); __Pyx_GIVEREF(__pyx_tuple__2); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< @@ -9157,7 +9157,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__3); __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< @@ -9168,7 +9168,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__4); __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see 
comment in numpy.pxd") # <<<<<<<<<<<<<< @@ -9179,7 +9179,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__5); __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< @@ -9190,7 +9190,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__6); __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< @@ -9201,7 +9201,7 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__7); __Pyx_GIVEREF(__pyx_tuple__7); - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< @@ -9827,7 +9827,7 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_test, __pyx_t_7) < 0) __PYX_ERR(0, 1, __pyx_L1_error) __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - /* "../../.virtualenvs/release/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 + /* "../../.virtualenvs/aaa/local/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -11538,7 +11538,7 @@ static 
CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_PY_LONG_LONG(unsigned P theta = 0; } else { r = -a.real; - theta = atan2f(0, -1); + theta = atan2f(0.0, -1.0); } } else { r = __Pyx_c_abs_float(a); @@ -11693,7 +11693,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_PY_LONG_LONG(unsigned P theta = 0; } else { r = -a.real; - theta = atan2(0, -1); + theta = atan2(0.0, -1.0); } } else { r = __Pyx_c_abs_double(a); diff --git a/gensim/models/keyedvectors.py b/gensim/models/keyedvectors.py index d9dad1cc56..1428503c8a 100644 --- a/gensim/models/keyedvectors.py +++ b/gensim/models/keyedvectors.py @@ -182,9 +182,7 @@ from gensim.models.utils_any2vec import ( _save_word2vec_format, _load_word2vec_format, - _compute_ngrams, - _ft_hash, - _ft_hash_broken + ft_ngram_hashes, ) from gensim.similarities.termsim import TermSimilarityIndex, SparseTermSimilarityMatrix @@ -513,6 +511,9 @@ def most_similar(self, positive=None, negative=None, topn=10, restrict_vocab=Non Sequence of (word, similarity). 
""" + if topn is not None and topn < 1: + return [] + if positive is None: positive = [] if negative is None: @@ -552,7 +553,7 @@ def most_similar(self, positive=None, negative=None, topn=10, restrict_vocab=Non limited = self.vectors_norm if restrict_vocab is None else self.vectors_norm[:restrict_vocab] dists = dot(limited, mean) - if not topn: + if topn is None: return dists best = matutils.argsort(dists, topn=topn + len(all_words), reverse=True) # ignore (don't return) words from the input @@ -1512,6 +1513,15 @@ def get_keras_embedding(self, train_embeddings=False): ) return layer + @classmethod + def load(cls, fname_or_handle, **kwargs): + model = super(WordEmbeddingsKeyedVectors, cls).load(fname_or_handle, **kwargs) + if isinstance(model, FastTextKeyedVectors): + if not hasattr(model, 'compatible_hash'): + model.compatible_hash = False + + return model + KeyedVectors = Word2VecKeyedVectors # alias for backward compatibility @@ -1804,7 +1814,7 @@ def distances(self, d1, other_docs=()): other_vectors = self[other_docs] return 1 - WordEmbeddingsKeyedVectors.cosine_similarities(input_vector, other_vectors) - def similarity_unseen_docs(self, model, doc_words1, doc_words2, alpha=0.1, min_alpha=0.0001, steps=5): + def similarity_unseen_docs(self, model, doc_words1, doc_words2, alpha=None, min_alpha=None, steps=None): """Compute cosine similarity between two post-bulk out of training documents. Parameters @@ -1939,11 +1949,14 @@ class FastTextKeyedVectors(WordEmbeddingsKeyedVectors): Attributes ---------- vectors_vocab : np.array - A vector for each entity in the vocabulary. + Each row corresponds to a vector for an entity in the vocabulary. + Columns correspond to vector dimensions. vectors_vocab_norm : np.array Same as vectors_vocab, but the vectors are L2 normalized. vectors_ngrams : np.array A vector for each ngram across all entities in the vocabulary. + Each row is a vector that corresponds to a bucket. + Columns correspond to vector dimensions. 
vectors_ngrams_norm : np.array Same as vectors_ngrams, but the vectors are L2 normalized. Under some conditions, may actually be the same matrix as @@ -1957,7 +1970,8 @@ class FastTextKeyedVectors(WordEmbeddingsKeyedVectors): bucket to an index, and then indexing into vectors_ngrams (in other words, vectors_ngrams[hash2index[hash_fn(ngram) % bucket]]. num_ngram_vectors : int - TODO + The number of vectors that correspond to ngrams, as opposed to terms + (full words). """ def __init__(self, vector_size, min_n, max_n, bucket, compatible_hash): @@ -1974,6 +1988,14 @@ def __init__(self, vector_size, min_n, max_n, bucket, compatible_hash): self.num_ngram_vectors = 0 self.compatible_hash = compatible_hash + @classmethod + def load(cls, fname_or_handle, **kwargs): + model = super(WordEmbeddingsKeyedVectors, cls).load(fname_or_handle, **kwargs) + if not hasattr(model, 'compatible_hash'): + model.compatible_hash = False + + return model + @property @deprecated("Attribute will be removed in 4.0.0, use self.vectors_vocab instead") def syn0_vocab(self): @@ -2012,9 +2034,8 @@ def __contains__(self, word): if word in self.vocab: return True else: - hash_fn = _ft_hash if self.compatible_hash else _ft_hash_broken - char_ngrams = _compute_ngrams(word, self.min_n, self.max_n) - return any(hash_fn(ng) % self.bucket in self.hash2index for ng in char_ngrams) + hashes = ft_ngram_hashes(word, self.min_n, self.max_n, self.bucket, self.compatible_hash) + return any(h in self.hash2index for h in hashes) def save(self, *args, **kwargs): """Save object. @@ -2056,23 +2077,18 @@ def word_vec(self, word, use_norm=False): If word and all ngrams not in vocabulary. 
""" - hash_fn = _ft_hash if self.compatible_hash else _ft_hash_broken - if word in self.vocab: return super(FastTextKeyedVectors, self).word_vec(word, use_norm) elif self.bucket == 0: raise KeyError('cannot calculate vector for OOV word without ngrams') else: - # from gensim.models.fasttext import compute_ngrams word_vec = np.zeros(self.vectors_ngrams.shape[1], dtype=np.float32) - ngrams = _compute_ngrams(word, self.min_n, self.max_n) if use_norm: ngram_weights = self.vectors_ngrams_norm else: ngram_weights = self.vectors_ngrams ngrams_found = 0 - for ngram in ngrams: - ngram_hash = hash_fn(ngram) % self.bucket + for ngram_hash in ft_ngram_hashes(word, self.min_n, self.max_n, self.bucket, self.compatible_hash): if ngram_hash in self.hash2index: word_vec += ngram_weights[self.hash2index[ngram_hash]] ngrams_found += 1 @@ -2130,7 +2146,7 @@ def init_ngrams_weights(self, seed): self.min_n, self.max_n, self.bucket, - _ft_hash if self.compatible_hash else _ft_hash_broken, + self.compatible_hash, self.hash2index ) self.num_ngram_vectors = len(ngram_indices) @@ -2153,7 +2169,7 @@ def update_ngrams_weights(self, seed, old_vocab_len): self.min_n, self.max_n, self.bucket, - _ft_hash if self.compatible_hash else _ft_hash_broken, + self.compatible_hash, self.hash2index ) num_new_ngrams = len(new_ngram_hashes) @@ -2215,7 +2231,7 @@ def init_post_load(self, vectors, match_gensim=False): self.min_n, self.max_n, self.bucket, - _ft_hash if self.compatible_hash else _ft_hash_broken, + self.compatible_hash, dict(), # we don't care what goes here in this case ) ngram_hashes = sorted(set(ngram_hashes)) @@ -2237,19 +2253,16 @@ def adjust_vectors(self): if self.bucket == 0: return - hash_fn = _ft_hash if self.compatible_hash else _ft_hash_broken - for w, v in self.vocab.items(): word_vec = np.copy(self.vectors_vocab[v.index]) - ngrams = _compute_ngrams(w, self.min_n, self.max_n) - for ngram in ngrams: - ngram_index = self.hash2index[hash_fn(ngram) % self.bucket] - word_vec += 
self.vectors_ngrams[ngram_index] - word_vec /= len(ngrams) + 1 + ngram_hashes = ft_ngram_hashes(w, self.min_n, self.max_n, self.bucket, self.compatible_hash) + for nh in ngram_hashes: + word_vec += self.vectors_ngrams[self.hash2index[nh]] + word_vec /= len(ngram_hashes) + 1 self.vectors[v.index] = word_vec -def _process_fasttext_vocab(iterable, min_n, max_n, num_buckets, hash_fn, hash2index): +def _process_fasttext_vocab(iterable, min_n, max_n, num_buckets, compatible_hash, hash2index): """ Performs a common operation for FastText weight initialization and updates: scan the vocabulary, calculate ngrams and their hashes, keep @@ -2266,8 +2279,9 @@ def _process_fasttext_vocab(iterable, min_n, max_n, num_buckets, hash_fn, hash2i The maximum length of ngrams. num_buckets : int The number of buckets used by the model. - hash_fn : callable - Used to hash ngrams to buckets. + compatible_hash : boolean + True for compatibility with the Facebook implementation. + False for compatibility with the old Gensim implementation. hash2index : dict Updated in-place. @@ -2293,8 +2307,7 @@ def _process_fasttext_vocab(iterable, min_n, max_n, num_buckets, hash_fn, hash2i for word, vocab in iterable: wi = [] - for ngram in _compute_ngrams(word, min_n, max_n): - ngram_hash = hash_fn(ngram) % num_buckets + for ngram_hash in ft_ngram_hashes(word, min_n, max_n, num_buckets, compatible_hash): if ngram_hash not in hash2index: # # This is a new ngram. Reserve a new index in hash2index. 
diff --git a/gensim/models/ldamodel.py b/gensim/models/ldamodel.py index 503c2b48e3..786ec41c0b 100755 --- a/gensim/models/ldamodel.py +++ b/gensim/models/ldamodel.py @@ -594,9 +594,19 @@ def __str__(self): self.num_terms, self.num_topics, self.decay, self.chunksize ) - def sync_state(self): - """Propagate the states topic probabilities to the inner object's attribute.""" - self.expElogbeta = np.exp(self.state.get_Elogbeta()) + def sync_state(self, current_Elogbeta=None): + """Propagate the states topic probabilities to the inner object's attribute. + + Parameters + ---------- + current_Elogbeta: numpy.ndarray + Posterior probabilities for each topic, optional. + If omitted, it will get Elogbeta from state. + """ + + if current_Elogbeta is None: + current_Elogbeta = self.state.get_Elogbeta() + self.expElogbeta = np.exp(current_Elogbeta) assert self.expElogbeta.dtype == self.dtype def clear(self): @@ -1027,14 +1037,16 @@ def do_mstep(self, rho, other, extra_pass=False): logger.debug("updating topics") # update self with the new blend; also keep track of how much did # the topics change through this update, to assess convergence - diff = np.log(self.expElogbeta) + previous_Elogbeta = self.state.get_Elogbeta() self.state.blend(rho, other) - diff -= self.state.get_Elogbeta() - self.sync_state() + + current_Elogbeta = self.state.get_Elogbeta() + self.sync_state(current_Elogbeta) # print out some debug info at the end of each EM iteration self.print_topics(5) - logger.info("topic diff=%f, rho=%f", np.mean(np.abs(diff)), rho) + diff = mean_absolute_difference(previous_Elogbeta.ravel(), current_Elogbeta.ravel()) + logger.info("topic diff=%f, rho=%f", diff, rho) if self.optimize_eta: self.update_eta(self.state.get_lambda(), rho) diff --git a/gensim/models/ldamulticore.py b/gensim/models/ldamulticore.py index e3ed274128..f3341fee0b 100644 --- a/gensim/models/ldamulticore.py +++ b/gensim/models/ldamulticore.py @@ -225,13 +225,14 @@ def update(self, corpus, 
chunks_as_numpy=False): self.state.numdocs += lencorpus - if not self.batch: - updatetype = "online" - updateafter = self.chunksize * self.workers - else: + if self.batch: updatetype = "batch" updateafter = lencorpus - evalafter = min(lencorpus, (self.eval_every or 0) * updateafter) + else: + updatetype = "online" + updateafter = self.chunksize * self.workers + eval_every = self.eval_every or 0 + evalafter = min(lencorpus, eval_every * updateafter) updates_per_pass = max(1, lencorpus / updateafter) logger.info( @@ -257,47 +258,45 @@ def update(self, corpus, chunks_as_numpy=False): def rho(): return pow(self.offset + pass_ + (self.num_updates / self.chunksize), -self.decay) + def process_result_queue(force=False): + """ + Clear the result queue, merging all intermediate results, and update the + LDA model if necessary. + + """ + merged_new = False + while not result_queue.empty(): + other.merge(result_queue.get()) + queue_size[0] -= 1 + merged_new = True + + if (force and merged_new and queue_size[0] == 0) or (other.numdocs >= updateafter): + self.do_mstep(rho(), other, pass_ > 0) + other.reset() + if eval_every > 0 and (force or (self.num_updates / updateafter) % eval_every == 0): + self.log_perplexity(chunk, total_docs=lencorpus) + logger.info("training LDA model using %i processes", self.workers) pool = Pool(self.workers, worker_e_step, (job_queue, result_queue,)) for pass_ in range(self.passes): queue_size, reallen = [0], 0 other = LdaState(self.eta, self.state.sstats.shape) - def process_result_queue(force=False): - """ - Clear the result queue, merging all intermediate results, and update the - LDA model if necessary. 
- - """ - merged_new = False - while not result_queue.empty(): - other.merge(result_queue.get()) - queue_size[0] -= 1 - merged_new = True - if (force and merged_new and queue_size[0] == 0) or (not self.batch and (other.numdocs >= updateafter)): - self.do_mstep(rho(), other, pass_ > 0) - other.reset() - if self.eval_every is not None \ - and ((force and queue_size[0] == 0) - or (self.eval_every != 0 and (self.num_updates / updateafter) % self.eval_every == 0)): - self.log_perplexity(chunk, total_docs=lencorpus) - chunk_stream = utils.grouper(corpus, self.chunksize, as_numpy=chunks_as_numpy) for chunk_no, chunk in enumerate(chunk_stream): reallen += len(chunk) # keep track of how many documents we've processed so far # put the chunk into the workers' input job queue - chunk_put = False - while not chunk_put: + while True: try: - job_queue.put((chunk_no, chunk, self), block=False, timeout=0.1) - chunk_put = True + job_queue.put((chunk_no, chunk, self), block=False) queue_size[0] += 1 logger.info( "PROGRESS: pass %i, dispatched chunk #%i = documents up to #%i/%i, " "outstanding queue size %i", pass_, chunk_no, chunk_no * self.chunksize + len(chunk), lencorpus, queue_size[0] ) + break except queue.Full: # in case the input job queue is full, keep clearing the # result queue, to make sure we don't deadlock diff --git a/gensim/models/ldaseqmodel.py b/gensim/models/ldaseqmodel.py index 1c9e8a55d9..642f12e28d 100644 --- a/gensim/models/ldaseqmodel.py +++ b/gensim/models/ldaseqmodel.py @@ -58,6 +58,7 @@ from scipy.special import digamma, gammaln from scipy import optimize import logging +from six.moves import range, zip logger = logging.getLogger(__name__) @@ -126,7 +127,7 @@ def __init__(self, corpus=None, time_slice=None, id2word=None, alphas=0.01, num_ logger.warning("no word id mapping provided; initializing from corpus, assuming identity") self.id2word = utils.dict_from_corpus(corpus) self.vocab_len = len(self.id2word) - elif len(self.id2word) > 0: + elif self.id2word: 
self.vocab_len = len(self.id2word) else: self.vocab_len = 0 @@ -142,12 +143,6 @@ def __init__(self, corpus=None, time_slice=None, id2word=None, alphas=0.01, num_ if self.time_slice is not None: self.num_time_slices = len(time_slice) - max_doc_len = 0 - for line_no, line in enumerate(corpus): - if len(line) > max_doc_len: - max_doc_len = len(line) - self.max_doc_len = max_doc_len - self.num_topics = num_topics self.num_time_slices = len(time_slice) self.alphas = np.full(num_topics, alphas) @@ -157,7 +152,7 @@ def __init__(self, corpus=None, time_slice=None, id2word=None, alphas=0.01, num_ # the sslm class is described below and contains information # on topic-word probabilities and doc-topic probabilities. self.topic_chains = [] - for topic in range(0, num_topics): + for topic in range(num_topics): sslm_ = sslm( num_time_slices=self.num_time_slices, vocab_len=self.vocab_len, num_topics=self.num_topics, chain_variance=chain_variance, obs_variance=obs_variance @@ -172,6 +167,8 @@ def __init__(self, corpus=None, time_slice=None, id2word=None, alphas=0.01, num_ # if a corpus and time_slice is provided, depending on the user choice of initializing LDA, we start DTM. 
if corpus is not None and time_slice is not None: + self.max_doc_len = max(len(line) for line in corpus) + if initialize == 'gensim': lda_model = ldamodel.LdaModel( corpus, id2word=self.id2word, num_topics=self.num_topics, @@ -268,12 +265,12 @@ def fit_lda_seq(self, corpus, lda_inference_max_iter, em_min_iter, em_max_iter, # initiate sufficient statistics topic_suffstats = [] - for topic in range(0, num_topics): - topic_suffstats.append(np.resize(np.zeros(vocab_len * data_len), (vocab_len, data_len))) + for topic in range(num_topics): + topic_suffstats.append(np.zeros((vocab_len, data_len))) # set up variables - gammas = np.resize(np.zeros(corpus_len * num_topics), (corpus_len, num_topics)) - lhoods = np.resize(np.zeros(corpus_len * num_topics + 1), (corpus_len, num_topics + 1)) + gammas = np.zeros((corpus_len, num_topics)) + lhoods = np.zeros((corpus_len, num_topics + 1)) # compute the likelihood of a sequential corpus under an LDA # seq model and find the evidence lower bound. This is the E - Step bound, gammas = \ @@ -346,7 +343,7 @@ def lda_seq_infer(self, corpus, topic_suffstats, gammas, lhoods, bound = 0.0 lda = ldamodel.LdaModel(num_topics=num_topics, alpha=self.alphas, id2word=self.id2word, dtype=np.float64) - lda.topics = np.array(np.split(np.zeros(vocab_len * num_topics), vocab_len)) + lda.topics = np.zeros((vocab_len, num_topics)) ldapost = LdaPost(max_doc_len=self.max_doc_len, num_topics=num_topics, lda=lda) model = "DTM" @@ -460,8 +457,8 @@ def make_lda_seq_slice(self, lda, time): The stationary model updated to reflect the passed time slice. 
""" - for k in range(0, self.num_topics): - lda.topics[:, k] = np.copy(self.topic_chains[k].e_log_prob[:, time]) + for k in range(self.num_topics): + lda.topics[:, k] = self.topic_chains[k].e_log_prob[:, time] lda.alpha = np.copy(self.alphas) return lda @@ -507,7 +504,7 @@ def print_topic_times(self, topic, top_terms=20): """ topics = [] - for time in range(0, self.num_time_slices): + for time in range(self.num_time_slices): topics.append(self.print_topic(topic, time, top_terms)) return topics @@ -530,7 +527,7 @@ def print_topics(self, time=0, top_terms=20): probability. """ - return [self.print_topic(topic, time, top_terms) for topic in range(0, self.num_topics)] + return [self.print_topic(topic, time, top_terms) for topic in range(self.num_topics)] def print_topic(self, topic, time=0, top_terms=20): """Get the list of words most relevant to the given topic. @@ -578,8 +575,7 @@ def doc_topics(self, doc_number): Probability for each topic in the mixture (essentially a point in the `self.num_topics - 1` simplex. """ - doc_topic = np.copy(self.gammas) - doc_topic /= doc_topic.sum(axis=1)[:, np.newaxis] + doc_topic = self.gammas / self.gammas.sum(axis=1)[:, np.newaxis] return doc_topic[doc_number] def dtm_vis(self, time, corpus): @@ -608,22 +604,25 @@ def dtm_vis(self, time, corpus): The set of unique terms existing in the cropuse's vocabulary. 
""" - doc_topic = np.copy(self.gammas) - doc_topic /= doc_topic.sum(axis=1)[:, np.newaxis] + doc_topic = self.gammas / self.gammas.sum(axis=1)[:, np.newaxis] + + def normalize(x): + return x / x.sum() topic_term = [ - np.exp(np.transpose(chain.e_log_prob)[time]) / np.exp(np.transpose(chain.e_log_prob)[time]).sum() + normalize(np.exp(chain.e_log_prob.T[time])) for k, chain in enumerate(self.topic_chains) ] - doc_lengths = [len(doc) for doc_no, doc in enumerate(corpus)] - + doc_lengths = [] term_frequency = np.zeros(self.vocab_len) for doc_no, doc in enumerate(corpus): - for pair in doc: - term_frequency[pair[0]] += pair[1] + doc_lengths.append(len(doc)) + + for term, freq in doc: + term_frequency[term] += freq - vocab = [self.id2word[i] for i in range(0, len(self.id2word))] + vocab = [self.id2word[i] for i in range(len(self.id2word))] return doc_topic, np.array(topic_term), doc_lengths, term_frequency, vocab @@ -668,13 +667,13 @@ def __getitem__(self, doc): Probabilities for each topic in the mixture. This is essentially a point in the `num_topics - 1` simplex. 
""" - lda_model = \ - ldamodel.LdaModel(num_topics=self.num_topics, alpha=self.alphas, id2word=self.id2word, dtype=np.float64) - lda_model.topics = np.array(np.split(np.zeros(self.vocab_len * self.num_topics), self.vocab_len)) + lda_model = ldamodel.LdaModel( + num_topics=self.num_topics, alpha=self.alphas, id2word=self.id2word, dtype=np.float64) + lda_model.topics = np.zeros((self.vocab_len, self.num_topics)) ldapost = LdaPost(num_topics=self.num_topics, max_doc_len=len(doc), lda=lda_model, doc=doc) time_lhoods = [] - for time in range(0, self.num_time_slices): + for time in range(self.num_time_slices): lda_model = self.make_lda_seq_slice(lda_model, time) # create lda_seq slice lhood = LdaPost.fit_lda_post(ldapost, 0, time, self) time_lhoods.append(lhood) @@ -706,12 +705,12 @@ def __init__(self, vocab_len=None, num_time_slices=None, num_topics=None, obs_va self.num_topics = num_topics # setting up matrices - self.obs = np.array(np.split(np.zeros(num_time_slices * vocab_len), vocab_len)) - self.e_log_prob = np.array(np.split(np.zeros(num_time_slices * vocab_len), vocab_len)) - self.mean = np.array(np.split(np.zeros((num_time_slices + 1) * vocab_len), vocab_len)) - self.fwd_mean = np.array(np.split(np.zeros((num_time_slices + 1) * vocab_len), vocab_len)) - self.fwd_variance = np.array(np.split(np.zeros((num_time_slices + 1) * vocab_len), vocab_len)) - self.variance = np.array(np.split(np.zeros((num_time_slices + 1) * vocab_len), vocab_len)) + self.obs = np.zeros((vocab_len, num_time_slices)) + self.e_log_prob = np.zeros((vocab_len, num_time_slices)) + self.mean = np.zeros((vocab_len, num_time_slices + 1)) + self.fwd_mean = np.zeros((vocab_len, num_time_slices + 1)) + self.fwd_variance = np.zeros((vocab_len, num_time_slices + 1)) + self.variance = np.zeros((vocab_len, num_time_slices + 1)) self.zeta = np.zeros(num_time_slices) # the following are class variables which are to be integrated during Document Influence Model @@ -896,9 +895,9 @@ def sslm_counts_init(self, 
obs_variance, chain_variance, sstats): T = self.num_time_slices log_norm_counts = np.copy(sstats) - log_norm_counts = log_norm_counts / sum(log_norm_counts) - log_norm_counts = log_norm_counts + 1.0 / W - log_norm_counts = log_norm_counts / sum(log_norm_counts) + log_norm_counts /= sum(log_norm_counts) + log_norm_counts += 1.0 / W + log_norm_counts /= sum(log_norm_counts) log_norm_counts = np.log(log_norm_counts) # setting variational observations to transformed counts @@ -908,7 +907,7 @@ def sslm_counts_init(self, obs_variance, chain_variance, sstats): self.chain_variance = chain_variance # compute post variance, mean - for w in range(0, W): + for w in range(W): self.variance[w], self.fwd_variance[w] = self.compute_post_variance(w, self.chain_variance) self.mean[w], self.fwd_mean[w] = self.compute_post_mean(w, self.chain_variance) @@ -944,7 +943,7 @@ def fit_sslm(self, sstats): # computing variance, fwd_variance self.variance, self.fwd_variance = \ - (np.array(x) for x in list(zip(*[self.compute_post_variance(w, self.chain_variance) for w in range(0, W)]))) + (np.array(x) for x in zip(*(self.compute_post_variance(w, self.chain_variance) for w in range(W)))) # column sum of sstats totals = sstats.sum(axis=0) @@ -1006,11 +1005,10 @@ def compute_bound(self, sstats, totals): chain_variance = self.chain_variance # computing mean, fwd_mean self.mean, self.fwd_mean = \ - (np.array(x) for x in zip(*[self.compute_post_mean(w, self.chain_variance) for w in range(0, w)])) + (np.array(x) for x in zip(*(self.compute_post_mean(w, self.chain_variance) for w in range(w)))) self.zeta = self.update_zeta() - for w in range(0, w): - val += (self.variance[w][0] - self.variance[w][t]) / 2 * chain_variance + val = sum(self.variance[w][0] - self.variance[w][t] for w in range(w)) / 2 * chain_variance logger.info("Computing bound, all times") @@ -1018,7 +1016,7 @@ def compute_bound(self, sstats, totals): term_1 = 0.0 term_2 = 0.0 ent = 0.0 - for w in range(0, w): + for w in range(w): m = 
self.mean[w][t] prev_m = self.mean[w][t - 1] @@ -1071,14 +1069,14 @@ def update_obs(self, sstats, totals): T = self.num_time_slices runs = 0 - mean_deriv_mtx = np.resize(np.zeros(T * (T + 1)), (T, T + 1)) + mean_deriv_mtx = np.zeros((T, T + 1)) norm_cutoff_obs = None - for w in range(0, W): + for w in range(W): w_counts = sstats[w] counts_norm = 0 # now we find L2 norm of w_counts - for i in range(0, len(w_counts)): + for i in range(len(w_counts)): counts_norm += w_counts[i] * w_counts[i] counts_norm = np.sqrt(counts_norm) @@ -1091,10 +1089,8 @@ def update_obs(self, sstats, totals): w_counts = np.zeros(len(w_counts)) # TODO: apply lambda function - for t in range(0, T): - mean_deriv = mean_deriv_mtx[t] - mean_deriv = self.compute_mean_deriv(w, t, mean_deriv) - mean_deriv_mtx[t] = mean_deriv + for t in range(T): + mean_deriv_mtx[t] = self.compute_mean_deriv(w, t, mean_deriv_mtx[t]) deriv = np.zeros(T) args = self, w_counts, totals, mean_deriv_mtx, w, deriv @@ -1207,10 +1203,10 @@ def compute_obs_deriv(self, word, word_counts, totals, mean_deriv_mtx, deriv): # temp_vector holds temporary zeta values self.temp_vect = np.zeros(T) - for u in range(0, T): + for u in range(T): self.temp_vect[u] = np.exp(mean[u + 1] + variance[u + 1] / 2) - for t in range(0, T): + for t in range(T): mean_deriv = mean_deriv_mtx[t] term1 = 0 term2 = 0 @@ -1280,8 +1276,8 @@ def __init__(self, doc=None, lda=None, max_doc_len=None, num_topics=None, gamma= self.lhood = np.zeros(num_topics + 1) if max_doc_len is not None and num_topics is not None: - self.phi = np.resize(np.zeros(max_doc_len * num_topics), (max_doc_len, num_topics)) - self.log_phi = np.resize(np.zeros(max_doc_len * num_topics), (max_doc_len, num_topics)) + self.phi = np.zeros((max_doc_len, num_topics)) + self.log_phi = np.zeros((max_doc_len, num_topics)) # the following are class variables which are to be integrated during Document Influence Model @@ -1314,12 +1310,12 @@ def update_phi(self, doc_number, time): # digamma values 
dig = np.zeros(num_topics) - for k in range(0, num_topics): + for k in range(num_topics): dig[k] = digamma(self.gamma[k]) n = 0 # keep track of iterations for phi, log_phi for word_id, count in self.doc: - for k in range(0, num_topics): + for k in range(num_topics): self.log_phi[n][k] = dig[k] + self.lda.topics[word_id][k] log_phi_row = self.log_phi[n] @@ -1355,7 +1351,7 @@ def update_gamma(self): n = 0 # keep track of number of iterations for phi, log_phi for word_id, count in self.doc: phi_row = self.phi[n] - for k in range(0, self.lda.num_topics): + for k in range(self.lda.num_topics): self.gamma[k] += phi_row[k] * count n += 1 @@ -1392,7 +1388,7 @@ def compute_lda_lhood(self): digsum = digamma(gamma_sum) model = "DTM" # noqa:F841 - for k in range(0, num_topics): + for k in range(num_topics): # below code only to be used in DIM mode # if ldapost.doc_weight is not None and (model == "DIM" or model == "fixed"): # influence_topic = ldapost.doc_weight[k] @@ -1518,7 +1514,7 @@ def update_lda_seq_ss(self, time, doc, topic_suffstats): """ num_topics = self.lda.num_topics - for k in range(0, num_topics): + for k in range(num_topics): topic_ss = topic_suffstats[k] n = 0 for word_id, count in self.doc: @@ -1639,6 +1635,7 @@ def df_obs(x, *args): if model == "DTM": deriv = sslm.compute_obs_deriv(word, word_counts, totals, mean_deriv_mtx, deriv) elif model == "DIM": - deriv = sslm.compute_obs_deriv_fixed(p.word, p.word_counts, p.totals, p.sslm, p.mean_deriv_mtx, deriv) # noqa:F821 + deriv = sslm.compute_obs_deriv_fixed( + p.word, p.word_counts, p.totals, p.sslm, p.mean_deriv_mtx, deriv) # noqa:F821 return np.negative(deriv) diff --git a/gensim/models/nmf.py b/gensim/models/nmf.py index 0a33660d00..d7993db5e7 100644 --- a/gensim/models/nmf.py +++ b/gensim/models/nmf.py @@ -1,10 +1,102 @@ -"""Online Non-Negative Matrix Factorization.""" +"""`Online Non-Negative Matrix Factorization. 
` +Implements online non-negative matrix factorization algorithm, which allows for fast latent topic inference. +This NMF implementation updates in a streaming fashion and works best with sparse corpora. + +- W is a word-topic matrix +- h is a topic-document matrix +- v is an input word-document matrix +- A, B - matrices that accumulate information from every consecutive chunk. A = h.dot(ht), B = v.dot(ht). + +The idea of the algorithm is as follows: + +.. code-block:: text + + Initialize W, A and B matrices + + Input corpus + Split corpus to batches + + for v in batches: + infer h: + do coordinate gradient descent step to find h that minimizes (v - Wh) l2 norm + + bound h so that it is non-negative + + update A and B: + A = h.dot(ht) + B = v.dot(ht) + + update W: + do gradient descent step to find W that minimizes 0.5*trace(WtWA) - trace(WtB) l2 norm + +Examples +-------- + +Train an NMF model using a Gensim corpus + +.. sourcecode:: pycon + + >>> from gensim.test.utils import common_texts + >>> from gensim.corpora.dictionary import Dictionary + >>> + >>> # Create a corpus from a list of texts + >>> common_dictionary = Dictionary(common_texts) + >>> common_corpus = [common_dictionary.doc2bow(text) for text in common_texts] + >>> + >>> # Train the model on the corpus. + >>> nmf = Nmf(common_corpus, num_topics=10) + +Save a model to disk, or reload a pre-trained model + +.. sourcecode:: pycon + + >>> from gensim.test.utils import datapath + >>> + >>> # Save model to disk. + >>> temp_file = datapath("model") + >>> nmf.save(temp_file) + >>> + >>> # Load a potentially pretrained model from disk. + >>> nmf = Nmf.load(temp_file) + +Infer vectors for new documents + +.. sourcecode:: pycon + + >>> # Create a new corpus, made of previously unseen documents. + >>> other_texts = [ + ... ['computer', 'time', 'graph'], + ... ['survey', 'response', 'eps'], + ... ['human', 'system', 'computer'] + ... 
] + >>> other_corpus = [common_dictionary.doc2bow(text) for text in other_texts] + >>> + >>> unseen_doc = other_corpus[0] + >>> vector = Nmf[unseen_doc] # get topic probability distribution for a document + +Update the model by incrementally training on the new corpus + +.. sourcecode:: pycon + + >>> nmf.update(other_corpus) + >>> vector = nmf[unseen_doc] + +A lot of parameters can be tuned to optimize training for your specific case + +.. sourcecode:: pycon + + >>> nmf = Nmf(common_corpus, num_topics=50, kappa=0.1, eval_every=5) # decrease training step size + +The NMF should be used whenever one needs extremely fast and memory optimized topic model. + +""" import itertools import logging import numpy as np import scipy.sparse +from gensim.models.nmf_pgd import solve_h from scipy.stats import halfnorm from gensim import interfaces @@ -12,10 +104,11 @@ from gensim import utils from gensim.interfaces import TransformedCorpus from gensim.models import basemodel, CoherenceModel -from gensim.models.nmf_pgd import solve_h, solve_r logger = logging.getLogger(__name__) +OLD_SCIPY = int(scipy.__version__.split('.')[1]) <= 18 + class Nmf(interfaces.TransformationABC, basemodel.BaseTopicModel): """Online Non-Negative Matrix Factorization. @@ -31,79 +124,74 @@ def __init__( id2word=None, chunksize=2000, passes=1, - lambda_=1.0, kappa=1.0, minimum_probability=0.01, - use_r=False, w_max_iter=200, w_stop_condition=1e-4, - h_r_max_iter=50, - h_r_stop_condition=1e-3, + h_max_iter=50, + h_stop_condition=1e-3, eval_every=10, - v_max=None, normalize=True, - sparse_coef=3, random_state=None, ): - """ + r""" Parameters ---------- corpus : iterable of list of (int, float), optional - Training corpus. If not given, model is left untrained. + Training corpus. + Can be either iterable of documents, which are lists of `(word_id, word_count)`, + or a sparse csc matrix of BOWs for each document. 
+ If not specified, the model is left uninitialized (presumably, to be trained later with `self.train()`). num_topics : int, optional Number of topics to extract. - id2word: gensim.corpora.Dictionary, optional - Mapping from token id to token. If not set words get replaced with word ids. + id2word: {dict of (int, str), :class:`gensim.corpora.dictionary.Dictionary`} + Mapping from word IDs to words. It is used to determine the vocabulary size, as well as for + debugging and topic printing. chunksize: int, optional Number of documents to be used in each training chunk. - passes: int, optioanl + passes: int, optional Number of full passes over the training corpus. - lambda_ : float, optional - Residuals regularizer coefficient. Increasing it helps prevent ovefitting. Has no effect if `use_r` is set - to False. + Leave at default `passes=1` if your input is a non-repeatable generator. kappa : float, optional - Optimizer step coefficient. Increaing it makes model train faster, but adds a risk that it won't converge. + Gradient descent step size. + Larger value makes the model train faster, but could lead to non-convergence if set too large. + minimum_probability: + If `normalize` is True, topics with smaller probabilities are filtered out. + If `normalize` is False, topics with smaller factors are filtered out. + If set to None, a value of 1e-8 is used to prevent 0s. w_max_iter: int, optional - Maximum number of iterations to train W matrix per each batch. + Maximum number of iterations to train W per each batch. w_stop_condition: float, optional - If error difference gets less than that, training of matrix ``W`` stops for current batch. - h_r_max_iter: int, optional - Maximum number of iterations to train h and r matrices per each batch. - h_r_stop_condition: float - If error difference gets less than that, training of matrices ``h`` and ``r`` stops for current batch. + If error difference gets less than that, training of ``W`` stops for the current batch. 
+ h_max_iter: int, optional + Maximum number of iterations to train h per each batch. + h_stop_condition: float + If error difference gets less than that, training of ``h`` stops for the current batch. eval_every: int, optional - Number of batches after which model will be evaluated. - v_max: int, optional - Maximum number of word occurrences in the corpora. Inferred if not set. Rarely needs to be set explicitly. - normalize: bool, optional - Whether to normalize results. Offers "kind-of-probabilistic" result. - sparse_coef: float, optional - The more it is, the more sparse are matrices. Significantly increases performance. + Number of batches after which l2 norm of (v - Wh) is computed. Decreases performance if set too low. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. random_state: {np.random.RandomState, int}, optional - Seed for random generator. Useful for reproducibility. + Seed for random generator. Needed for reproducibility. 
""" - self._w_error = None - self.num_tokens = None self.num_topics = num_topics self.id2word = id2word self.chunksize = chunksize self.passes = passes - self._lambda_ = lambda_ self._kappa = kappa self.minimum_probability = minimum_probability - self.use_r = use_r self._w_max_iter = w_max_iter self._w_stop_condition = w_stop_condition - self._h_r_max_iter = h_r_max_iter - self._h_r_stop_condition = h_r_stop_condition - self.v_max = v_max + self._h_max_iter = h_max_iter + self.h_stop_condition = h_stop_condition self.eval_every = eval_every self.normalize = normalize - self.sparse_coef = sparse_coef self.random_state = utils.get_random_state(random_state) + self.v_max = None + if self.id2word is None: self.id2word = utils.dict_from_corpus(corpus) @@ -114,9 +202,9 @@ def __init__( self._W = None self.w_std = None + self._w_error = np.inf self._h = None - self._r = None if corpus is not None: self.update(corpus) @@ -126,8 +214,8 @@ def get_topics(self, normalize=None): Parameters ---------- - normalize : bool, optional - Whether to normalize an output vector. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. Returns ------- @@ -135,7 +223,7 @@ def get_topics(self, normalize=None): The probability for each word in each topic, shape (`num_topics`, `vocabulary_size`). """ - dense_topics = self._W.T.toarray() + dense_topics = self._W.T if normalize is None: normalize = self.normalize if normalize: @@ -146,9 +234,8 @@ def get_topics(self, normalize=None): def __getitem__(self, bow, eps=None): return self.get_document_topics(bow, eps) - def show_topics(self, num_topics=10, num_words=10, log=False, - formatted=True, normalize=None): - """Get a representation for selected topics. + def show_topics(self, num_topics=10, num_words=10, log=False, formatted=True, normalize=None): + """Get the topics sorted by sparsity. 
Parameters ---------- @@ -160,12 +247,12 @@ def show_topics(self, num_topics=10, num_words=10, log=False, Number of words to be presented for each topic. These will be the most relevant words (assigned the highest probability for each topic). log : bool, optional - Whether the output is also logged, besides being returned. + Whether the result is also logged, besides being returned. formatted : bool, optional Whether the topic representations should be formatted as strings. If False, they are returned as 2 tuples of (word, probability). - normalize : bool, optional - Whether to normalize an output vector. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. Returns ------- @@ -177,7 +264,7 @@ def show_topics(self, num_topics=10, num_words=10, log=False, if normalize is None: normalize = self.normalize - sparsity = self._W.getnnz(axis=0) + sparsity = (self._W == 0).mean(axis=0) if num_topics < 0 or num_topics >= self.num_topics: num_topics = self.num_topics @@ -217,8 +304,8 @@ def show_topic(self, topicid, topn=10, normalize=None): The ID of the topic to be returned topn : int, optional Number of the most significant words that are associated with the topic. - normalize : bool, optional - Whether to normalize an output vector. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. Returns ------- @@ -245,8 +332,8 @@ def get_topic_terms(self, topicid, topn=10, normalize=None): The ID of the topic to be returned topn : int, optional Number of the most significant words that are associated with the topic. - normalize : bool, optional - Whether to normalize an output vector. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. 
Returns ------- @@ -254,7 +341,7 @@ def get_topic_terms(self, topicid, topn=10, normalize=None): Word ID - probability pairs for the most relevant words generated by the topic. """ - topic = self._W.getcol(topicid).toarray()[0] + topic = self._W[:, topicid] if normalize is None: normalize = self.normalize @@ -266,17 +353,20 @@ def get_topic_terms(self, topicid, topn=10, normalize=None): def top_topics(self, corpus=None, texts=None, dictionary=None, window_size=None, coherence='u_mass', topn=20, processes=-1): - """Get the topics with the highest coherence score the coherence for each topic. + """Get the topics sorted by coherence. Parameters ---------- corpus : iterable of list of (int, float), optional - Corpus in BoW format. + Training corpus. + Can be either iterable of documents, which are lists of `(word_id, word_count)`, + or a sparse csc matrix of BOWs for each document. + If not specified, the model is left uninitialized (presumably, to be trained later with `self.train()`). texts : list of list of str, optional Tokenized texts, needed for coherence models that use sliding window based (i.e. coherence=`c_something`) probability estimator . - dictionary : :class:`~gensim.corpora.dictionary.Dictionary`, optional - Gensim dictionary mapping of id word to create corpus. + dictionary : {dict of (int, str), :class:`gensim.corpora.dictionary.Dictionary`}, optional + Dictionary mapping of id word to create corpus. If `model.id2word` is present, this is not needed. If both are provided, passed `dictionary` will be used. window_size : int, optional Is the size of the window to be used for coherence measures using boolean sliding window as their @@ -323,8 +413,11 @@ def log_perplexity(self, corpus): Parameters ---------- - corpus : list of list of (int, float) - The corpus on which the perplexity is computed. + corpus : iterable of list of (int, float), optional + Training corpus. 
+ Can be either iterable of documents, which are lists of `(word_id, word_count)`, + or a sparse csc matrix of BOWs for each document. + If not specified, the model is left uninitialized (presumably, to be trained later with `self.train()`). Returns ------- @@ -346,8 +439,7 @@ def log_perplexity(self, corpus): return (np.log(pred_factors, where=pred_factors > 0) * dense_corpus).sum() / dense_corpus.sum() - def get_term_topics(self, word_id, minimum_probability=None, - normalize=None): + def get_term_topics(self, word_id, minimum_probability=None, normalize=None): """Get the most relevant topics to the given word. Parameters @@ -355,9 +447,11 @@ def get_term_topics(self, word_id, minimum_probability=None, word_id : int The word for which the topic distribution will be computed. minimum_probability : float, optional - Topics with an assigned probability below this threshold will be discarded. - normalize : bool, optional - Whether to normalize an output vector. + If `normalize` is True, topics with smaller probabilities are filtered out. + If `normalize` is False, topics with smaller factors are filtered out. + If set to None, a value of 1e-8 is used to prevent 0s. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. Returns ------- @@ -376,7 +470,7 @@ def get_term_topics(self, word_id, minimum_probability=None, values = [] - word_topics = self._W.getrow(word_id) + word_topics = self._W[word_id] if normalize is None: normalize = self.normalize @@ -384,7 +478,7 @@ def get_term_topics(self, word_id, minimum_probability=None, word_topics /= word_topics.sum() for topic_id in range(0, self.num_topics): - word_coef = word_topics[0, topic_id] + word_coef = word_topics[topic_id] if word_coef >= minimum_probability: values.append((topic_id, word_coef)) @@ -400,9 +494,11 @@ def get_document_topics(self, bow, minimum_probability=None, bow : list of (int, float) The document in BOW format. 
minimum_probability : float - Topics with an assigned probability lower than this threshold will be discarded. - normalize : bool, optional - Whether to normalize an output vector. + If `normalize` is True, topics with smaller probabilities are filtered out. + If `normalize` is False, topics with smaller factors are filtered out. + If set to None, a value of 1e-8 is used to prevent 0s. + normalize: bool or None, optional + Whether to normalize the result. Allows for estimation of perplexity, coherence, e.t.c. Returns ------- @@ -422,18 +518,18 @@ def get_document_topics(self, bow, minimum_probability=None, kwargs = dict(minimum_probability=minimum_probability) return self._apply(corpus, **kwargs) - v = matutils.corpus2csc([bow], len(self.id2word)).tocsr() - h, _ = self._solveproj(v, self._W, v_max=np.inf) + v = matutils.corpus2csc([bow], self.num_tokens) + h = self._solveproj(v, self._W, v_max=np.inf) if normalize is None: normalize = self.normalize if normalize: - h.data /= h.sum() + h /= h.sum() return [ - (idx, proba.toarray()[0, 0]) + (idx, proba) for idx, proba in enumerate(h[:, 0]) - if not minimum_probability or proba.toarray()[0, 0] > minimum_probability + if not minimum_probability or proba > minimum_probability ] def _setup(self, corpus): @@ -441,14 +537,21 @@ def _setup(self, corpus): Parameters ---------- - corpus : iterable of list(int, float) + corpus : iterable of list of (int, float), optional Training corpus. + Can be either iterable of documents, which are lists of `(word_id, word_count)`, + or a sparse csc matrix of BOWs for each document. + If not specified, the model is left uninitialized (presumably, to be trained later with `self.train()`). 
""" - self._h, self._r = None, None - first_doc_it = itertools.tee(corpus, 1) - first_doc = next(first_doc_it[0]) - first_doc = matutils.corpus2csc([first_doc], len(self.id2word)) + self._h = None + + if isinstance(corpus, scipy.sparse.csc.csc_matrix): + first_doc = corpus.getcol(0) + else: + first_doc_it = itertools.tee(corpus, 1) + first_doc = next(first_doc_it[0]) + first_doc = matutils.corpus2csc([first_doc], len(self.id2word)) self.w_std = np.sqrt(first_doc.mean() / (self.num_tokens * self.num_topics)) self._W = np.abs( @@ -458,90 +561,88 @@ def _setup(self, corpus): ) ) - is_great_enough = self._W > self.w_std * self.sparse_coef + self.A = np.zeros((self.num_topics, self.num_topics)) + self.B = np.zeros((self.num_tokens, self.num_topics)) - self._W *= is_great_enough | ~is_great_enough.all(axis=0) - - self._W = scipy.sparse.csc_matrix(self._W) - - self.A = scipy.sparse.csr_matrix((self.num_topics, self.num_topics)) - self.B = scipy.sparse.csc_matrix((self.num_tokens, self.num_topics)) - - def update(self, corpus, chunks_as_numpy=False): + def update(self, corpus): """Train the model with new documents. Parameters ---------- - corpus : iterable of list(int, float) + corpus : iterable of list of (int, float), optional Training corpus. - chunks_as_numpy : bool, optional - Whether each chunk passed to the inference step should be a numpy.ndarray or not. Numpy can in some settings - turn the term IDs into floats, these will be converted back into integers in inference, which incurs a - performance hit. For distributed computing it may be desirable to keep the chunks as `numpy.ndarray`. + Can be either iterable of documents, which are lists of `(word_id, word_count)`, + or a sparse csc matrix of BOWs for each document. + If not specified, the model is left uninitialized (presumably, to be trained later with `self.train()`). 
""" - if self._W is None: self._setup(corpus) chunk_idx = 1 for _ in range(self.passes): - for chunk in utils.grouper( - corpus, self.chunksize, as_numpy=chunks_as_numpy - ): - self.random_state.shuffle(chunk) - v = matutils.corpus2csc(chunk, len(self.id2word)).tocsr() - self._h, self._r = self._solveproj( - v, self._W, r=self._r, h=self._h, v_max=self.v_max + if isinstance(corpus, scipy.sparse.csc.csc_matrix): + grouper = ( + corpus[:, col_idx:col_idx + self.chunksize] + for col_idx + in range(0, corpus.shape[1], self.chunksize) ) - h, r = self._h, self._r + else: + grouper = utils.grouper(corpus, self.chunksize) + + for chunk in grouper: + if isinstance(corpus, scipy.sparse.csc.csc_matrix): + v = chunk[:, self.random_state.permutation(chunk.shape[1])] + else: + self.random_state.shuffle(chunk) + + v = matutils.corpus2csc( + chunk, + num_terms=self.num_tokens, + ) + + self._h = self._solveproj(v, self._W, h=self._h, v_max=self.v_max) + h = self._h self.A *= chunk_idx - 1 self.A += h.dot(h.T) self.A /= chunk_idx self.B *= chunk_idx - 1 - self.B += (v - r).dot(h.T) + self.B += v.dot(h.T) self.B /= chunk_idx + prev_w_error = self._w_error + self._solve_w() if chunk_idx % self.eval_every == 0: - logger.info( - "Loss (no outliers): {}\tLoss (with outliers): {}".format( - scipy.sparse.linalg.norm(v - self._W.dot(h)), - scipy.sparse.linalg.norm(v - self._W.dot(h) - r), - ) - ) + logger.info("Loss: {}".format(self._w_error / prev_w_error)) chunk_idx += 1 - logger.info( - "Loss (no outliers): {}\tLoss (with outliers): {}".format( - scipy.sparse.linalg.norm(v - self._W.dot(h)), - scipy.sparse.linalg.norm(v - self._W.dot(h) - r), - ) - ) + logger.info("Loss: {}".format(self._w_error / prev_w_error)) def _solve_w(self): - """Update W matrix.""" + """Update W.""" def error(): + Wt = self._W.T return ( - 0.5 * self._W.T.dot(self._W).dot(self.A).diagonal().sum() - - self._W.T.dot(self.B).diagonal().sum() + 0.5 * Wt.dot(self._W).dot(self.A).trace() + - Wt.dot(self.B).trace() ) - 
eta = self._kappa / scipy.sparse.linalg.norm(self.A) + eta = self._kappa / np.linalg.norm(self.A) for iter_number in range(self._w_max_iter): - logger.debug("w_error: %s" % self._w_error) + logger.debug("w_error: {}".format(self._w_error)) error_ = error() if ( - self._w_error + self._w_error < np.inf and np.abs((error_ - self._w_error) / self._w_error) < self._w_stop_condition ): break @@ -556,8 +657,11 @@ def _apply(self, corpus, chunksize=None, **kwargs): Parameters ---------- - corpus : iterable of list of (int, number) - Corpus in sparse Gensim bag-of-words format. + corpus : iterable of list of (int, float), optional + Training corpus. + Can be either iterable of documents, which are lists of `(word_id, word_count)`, + or a sparse csc matrix of BOWs for each document. + If not specified, the model is left uninitialized (presumably, to be trained later with `self.train()`). chunksize : int, optional If provided, a more effective processing will performed. @@ -571,36 +675,29 @@ def _apply(self, corpus, chunksize=None, **kwargs): def _transform(self): """Apply boundaries on W.""" - np.clip(self._W.data, 0, self.v_max, out=self._W.data) - self._W.eliminate_zeros() - sumsq = scipy.sparse.linalg.norm(self._W, axis=0) + np.clip(self._W, 0, self.v_max, out=self._W) + sumsq = np.linalg.norm(self._W, axis=0) np.maximum(sumsq, 1, out=sumsq) - sumsq = np.repeat(sumsq, self._W.getnnz(axis=0)) - self._W.data /= sumsq + self._W /= sumsq - is_great_enough_data = self._W.data > self.w_std * self.sparse_coef - is_great_enough = self._W.toarray() > self.w_std * self.sparse_coef - is_all_too_small = is_great_enough.sum(axis=0) == 0 - is_all_too_small = np.repeat(is_all_too_small, self._W.getnnz(axis=0)) - - is_great_enough_data |= is_all_too_small - - self._W.data *= is_great_enough_data - self._W.eliminate_zeros() + @staticmethod + def _dense_dot_csc(dense, csc): + if OLD_SCIPY: + return (csc.T.dot(dense.T)).T + else: + return scipy.sparse.csc_matrix.dot(dense, csc) - def 
_solveproj(self, v, W, h=None, r=None, v_max=None): + def _solveproj(self, v, W, h=None, v_max=None): """Update residuals and representation(h) matrices. Parameters ---------- - v : iterable of list(int, float) + v : scipy.sparse.csc_matrix Subset of training corpus. - W : scipy.sparse.csc_matrix + W : ndarray Dictionary matrix. - h : scipy.sparse.csr_matrix + h : ndarray Representation matrix. - r : scipy.sparse.csr_matrix - Residuals matrix. v_max : float Maximum possible value in matrices. @@ -612,45 +709,30 @@ def _solveproj(self, v, W, h=None, r=None, v_max=None): self.v_max = v.max() batch_size = v.shape[1] - rshape = (m, batch_size) hshape = (n, batch_size) if h is None or h.shape != hshape: - h = scipy.sparse.csr_matrix(hshape) - - if r is None or r.shape != rshape: - r = scipy.sparse.csr_matrix(rshape) + h = np.zeros(hshape) - WtW = W.T.dot(W) + Wt = W.T + WtW = Wt.dot(W) - _h_r_error = None + h_error = None - for iter_number in range(self._h_r_max_iter): - logger.debug("h_r_error: %s" % _h_r_error) + for iter_number in range(self._h_max_iter): + logger.debug("h_error: {}".format(h_error)) - error_ = 0. 
+ Wtv = self._dense_dot_csc(Wt, v) - Wt_v_minus_r = W.T.dot(v - r) + permutation = self.random_state.permutation(self.num_topics).astype(np.int32) - h_ = h.toarray() - error_ = max( - error_, solve_h(h_, Wt_v_minus_r.toarray(), WtW.toarray(), self._kappa) - ) - h = scipy.sparse.csr_matrix(h_) - - if self.use_r: - r_actual = v - W.dot(h) - error_ = max( - error_, - solve_r(r, r_actual, self._lambda_, self.v_max) - ) - r = r_actual + error_ = solve_h(h, Wtv, WtW, permutation, self._kappa) error_ /= m - if _h_r_error and np.abs(_h_r_error - error_) < self._h_r_stop_condition: + if h_error and np.abs(h_error - error_) < self.h_stop_condition: break - _h_r_error = error_ + h_error = error_ - return h, r + return h diff --git a/gensim/models/nmf_pgd.c b/gensim/models/nmf_pgd.c index 83857ce7fa..2a1aa2ac3e 100644 --- a/gensim/models/nmf_pgd.c +++ b/gensim/models/nmf_pgd.c @@ -1,4 +1,4 @@ -/* Generated by Cython 0.29.2 */ +/* Generated by Cython 0.29.3 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -7,8 +7,8 @@ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. 
#else -#define CYTHON_ABI "0_29_2" -#define CYTHON_HEX_VERSION 0x001D02F0 +#define CYTHON_ABI "0_29_3" +#define CYTHON_HEX_VERSION 0x001D03F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -398,7 +398,7 @@ typedef int Py_tss_t; static CYTHON_INLINE int PyThread_tss_create(Py_tss_t *key) { *key = PyThread_create_key(); - return 0; // PyThread_create_key reports success always + return 0; } static CYTHON_INLINE Py_tss_t * PyThread_tss_alloc(void) { Py_tss_t *key = (Py_tss_t *)PyObject_Malloc(sizeof(Py_tss_t)); @@ -421,7 +421,7 @@ static CYTHON_INLINE int PyThread_tss_set(Py_tss_t *key, void *value) { static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { return PyThread_get_key_value(*key); } -#endif // TSS (Thread Specific Storage) API +#endif #if CYTHON_COMPILING_IN_CPYTHON || defined(_PyDict_NewPresized) #define __Pyx_PyDict_NewPresized(n) ((n <= 8) ? PyDict_New() : _PyDict_NewPresized(n)) #else @@ -1614,6 +1614,9 @@ static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_d_dc_d /* ObjectToMemviewSlice.proto */ static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_dsds_double(PyObject *, int writable_flag); +/* ObjectToMemviewSlice.proto */ +static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_dc_int(PyObject *, int writable_flag); + /* MemviewSliceCopyTemplate.proto */ static __Pyx_memviewslice __pyx_memoryview_copy_new_contig(const __Pyx_memviewslice *from_mvs, @@ -1636,12 +1639,6 @@ static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value); /* CIntFromPy.proto */ static CYTHON_INLINE char __Pyx_PyInt_As_char(PyObject *); -/* ObjectToMemviewSlice.proto */ -static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_dc_int(PyObject *, int writable_flag); - -/* ObjectToMemviewSlice.proto */ -static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_dc_double(PyObject *, int writable_flag); - /* CheckBinaryVersion.proto */ static int 
__Pyx_check_binary_version(void); @@ -1675,7 +1672,6 @@ static int __pyx_memoryview_thread_locks_used; static PyThread_type_lock __pyx_memoryview_thread_locks[8]; static double __pyx_f_6gensim_6models_7nmf_pgd_fmin(double, double); /*proto*/ static double __pyx_f_6gensim_6models_7nmf_pgd_fmax(double, double); /*proto*/ -static double __pyx_f_6gensim_6models_7nmf_pgd_clip(double, double, double); /*proto*/ static struct __pyx_array_obj *__pyx_array_new(PyObject *, Py_ssize_t, char *, char *, char *); /*proto*/ static void *__pyx_align_pointer(void *, size_t); /*proto*/ static PyObject *__pyx_memoryview_new(PyObject *, int, int, __Pyx_TypeInfo *); /*proto*/ @@ -1727,13 +1723,12 @@ static PyObject *__pyx_builtin_IndexError; static const char __pyx_k_O[] = "O"; static const char __pyx_k_c[] = "c"; static const char __pyx_k_h[] = "h"; -static const char __pyx_k_r[] = "r"; static const char __pyx_k_id[] = "id"; static const char __pyx_k_WtW[] = "WtW"; +static const char __pyx_k_Wtv[] = "Wtv"; static const char __pyx_k_new[] = "__new__"; static const char __pyx_k_obj[] = "obj"; static const char __pyx_k_base[] = "base"; -static const char __pyx_k_data[] = "data"; static const char __pyx_k_dict[] = "__dict__"; static const char __pyx_k_grad[] = "grad"; static const char __pyx_k_main[] = "__main__"; @@ -1753,57 +1748,42 @@ static const char __pyx_k_kappa[] = "kappa"; static const char __pyx_k_range[] = "range"; static const char __pyx_k_shape[] = "shape"; static const char __pyx_k_start[] = "start"; -static const char __pyx_k_v_max[] = "v_max"; static const char __pyx_k_encode[] = "encode"; static const char __pyx_k_format[] = "format"; static const char __pyx_k_import[] = "__import__"; -static const char __pyx_k_indptr[] = "indptr"; -static const char __pyx_k_lambda[] = "lambda_"; static const char __pyx_k_name_2[] = "__name__"; static const char __pyx_k_pickle[] = "pickle"; -static const char __pyx_k_r_data[] = "r_data"; static const char __pyx_k_reduce[] = "__reduce__"; 
static const char __pyx_k_struct[] = "struct"; static const char __pyx_k_unpack[] = "unpack"; static const char __pyx_k_update[] = "update"; static const char __pyx_k_fortran[] = "fortran"; static const char __pyx_k_hessian[] = "hessian"; -static const char __pyx_k_indices[] = "indices"; static const char __pyx_k_memview[] = "memview"; static const char __pyx_k_solve_h[] = "solve_h"; -static const char __pyx_k_solve_r[] = "solve_r"; static const char __pyx_k_Ellipsis[] = "Ellipsis"; static const char __pyx_k_getstate[] = "__getstate__"; static const char __pyx_k_itemsize[] = "itemsize"; static const char __pyx_k_pyx_type[] = "__pyx_type"; -static const char __pyx_k_r_actual[] = "r_actual"; -static const char __pyx_k_r_indptr[] = "r_indptr"; static const char __pyx_k_setstate[] = "__setstate__"; static const char __pyx_k_TypeError[] = "TypeError"; static const char __pyx_k_enumerate[] = "enumerate"; static const char __pyx_k_n_samples[] = "n_samples"; static const char __pyx_k_pyx_state[] = "__pyx_state"; -static const char __pyx_k_r_col_idx[] = "r_col_idx"; -static const char __pyx_k_r_element[] = "r_element"; -static const char __pyx_k_r_indices[] = "r_indices"; static const char __pyx_k_reduce_ex[] = "__reduce_ex__"; static const char __pyx_k_violation[] = "violation"; static const char __pyx_k_IndexError[] = "IndexError"; static const char __pyx_k_ValueError[] = "ValueError"; static const char __pyx_k_pyx_result[] = "__pyx_result"; static const char __pyx_k_pyx_vtable[] = "__pyx_vtable__"; -static const char __pyx_k_r_col_size[] = "r_col_size"; static const char __pyx_k_sample_idx[] = "sample_idx"; static const char __pyx_k_MemoryError[] = "MemoryError"; static const char __pyx_k_PickleError[] = "PickleError"; -static const char __pyx_k_Wt_v_minus_r[] = "Wt_v_minus_r"; +static const char __pyx_k_permutation[] = "permutation"; static const char __pyx_k_n_components[] = "n_components"; static const char __pyx_k_pyx_checksum[] = "__pyx_checksum"; -static const char 
__pyx_k_r_col_indptr[] = "r_col_indptr"; static const char __pyx_k_stringsource[] = "stringsource"; static const char __pyx_k_pyx_getbuffer[] = "__pyx_getbuffer"; -static const char __pyx_k_r_actual_data[] = "r_actual_data"; -static const char __pyx_k_r_actual_sign[] = "r_actual_sign"; static const char __pyx_k_reduce_cython[] = "__reduce_cython__"; static const char __pyx_k_projected_grad[] = "projected_grad"; static const char __pyx_k_View_MemoryView[] = "View.MemoryView"; @@ -1812,16 +1792,10 @@ static const char __pyx_k_component_idx_1[] = "component_idx_1"; static const char __pyx_k_component_idx_2[] = "component_idx_2"; static const char __pyx_k_dtype_is_object[] = "dtype_is_object"; static const char __pyx_k_pyx_PickleError[] = "__pyx_PickleError"; -static const char __pyx_k_r_actual_indptr[] = "r_actual_indptr"; static const char __pyx_k_setstate_cython[] = "__setstate_cython__"; -static const char __pyx_k_r_actual_col_idx[] = "r_actual_col_idx"; -static const char __pyx_k_r_actual_element[] = "r_actual_element"; -static const char __pyx_k_r_actual_indices[] = "r_actual_indices"; static const char __pyx_k_pyx_unpickle_Enum[] = "__pyx_unpickle_Enum"; -static const char __pyx_k_r_actual_col_size[] = "r_actual_col_size"; static const char __pyx_k_cline_in_traceback[] = "cline_in_traceback"; static const char __pyx_k_strided_and_direct[] = ""; -static const char __pyx_k_r_actual_col_indptr[] = "r_actual_col_indptr"; static const char __pyx_k_strided_and_indirect[] = ""; static const char __pyx_k_contiguous_and_direct[] = ""; static const char __pyx_k_gensim_models_nmf_pgd[] = "gensim.models.nmf_pgd"; @@ -1871,7 +1845,7 @@ static PyObject *__pyx_kp_s_Unable_to_convert_item_to_object; static PyObject *__pyx_n_s_ValueError; static PyObject *__pyx_n_s_View_MemoryView; static PyObject *__pyx_n_s_WtW; -static PyObject *__pyx_n_s_Wt_v_minus_r; +static PyObject *__pyx_n_s_Wtv; static PyObject *__pyx_n_s_allocate_buffer; static PyObject *__pyx_n_s_base; static PyObject 
*__pyx_n_s_c; @@ -1882,7 +1856,6 @@ static PyObject *__pyx_n_s_component_idx_1; static PyObject *__pyx_n_s_component_idx_2; static PyObject *__pyx_kp_s_contiguous_and_direct; static PyObject *__pyx_kp_s_contiguous_and_indirect; -static PyObject *__pyx_n_s_data; static PyObject *__pyx_n_s_dict; static PyObject *__pyx_n_s_dtype_is_object; static PyObject *__pyx_n_s_encode; @@ -1901,12 +1874,9 @@ static PyObject *__pyx_n_s_h; static PyObject *__pyx_n_s_hessian; static PyObject *__pyx_n_s_id; static PyObject *__pyx_n_s_import; -static PyObject *__pyx_n_s_indices; -static PyObject *__pyx_n_s_indptr; static PyObject *__pyx_n_s_itemsize; static PyObject *__pyx_kp_s_itemsize_0_for_cython_array; static PyObject *__pyx_n_s_kappa; -static PyObject *__pyx_n_s_lambda; static PyObject *__pyx_n_s_main; static PyObject *__pyx_n_s_memview; static PyObject *__pyx_n_s_mode; @@ -1919,6 +1889,7 @@ static PyObject *__pyx_n_s_new; static PyObject *__pyx_kp_s_no_default___reduce___due_to_non; static PyObject *__pyx_n_s_obj; static PyObject *__pyx_n_s_pack; +static PyObject *__pyx_n_s_permutation; static PyObject *__pyx_n_s_pickle; static PyObject *__pyx_n_s_projected_grad; static PyObject *__pyx_n_s_pyx_PickleError; @@ -1929,23 +1900,6 @@ static PyObject *__pyx_n_s_pyx_state; static PyObject *__pyx_n_s_pyx_type; static PyObject *__pyx_n_s_pyx_unpickle_Enum; static PyObject *__pyx_n_s_pyx_vtable; -static PyObject *__pyx_n_s_r; -static PyObject *__pyx_n_s_r_actual; -static PyObject *__pyx_n_s_r_actual_col_idx; -static PyObject *__pyx_n_s_r_actual_col_indptr; -static PyObject *__pyx_n_s_r_actual_col_size; -static PyObject *__pyx_n_s_r_actual_data; -static PyObject *__pyx_n_s_r_actual_element; -static PyObject *__pyx_n_s_r_actual_indices; -static PyObject *__pyx_n_s_r_actual_indptr; -static PyObject *__pyx_n_s_r_actual_sign; -static PyObject *__pyx_n_s_r_col_idx; -static PyObject *__pyx_n_s_r_col_indptr; -static PyObject *__pyx_n_s_r_col_size; -static PyObject *__pyx_n_s_r_data; -static 
PyObject *__pyx_n_s_r_element; -static PyObject *__pyx_n_s_r_indices; -static PyObject *__pyx_n_s_r_indptr; static PyObject *__pyx_n_s_range; static PyObject *__pyx_n_s_reduce; static PyObject *__pyx_n_s_reduce_cython; @@ -1956,7 +1910,6 @@ static PyObject *__pyx_n_s_setstate_cython; static PyObject *__pyx_n_s_shape; static PyObject *__pyx_n_s_size; static PyObject *__pyx_n_s_solve_h; -static PyObject *__pyx_n_s_solve_r; static PyObject *__pyx_n_s_start; static PyObject *__pyx_n_s_step; static PyObject *__pyx_n_s_stop; @@ -1970,10 +1923,8 @@ static PyObject *__pyx_kp_s_unable_to_allocate_array_data; static PyObject *__pyx_kp_s_unable_to_allocate_shape_and_str; static PyObject *__pyx_n_s_unpack; static PyObject *__pyx_n_s_update; -static PyObject *__pyx_n_s_v_max; static PyObject *__pyx_n_s_violation; -static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObject *__pyx_self, __Pyx_memviewslice __pyx_v_h, __Pyx_memviewslice __pyx_v_Wt_v_minus_r, __Pyx_memviewslice __pyx_v_WtW, double __pyx_v_kappa); /* proto */ -static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_2solve_r(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_r, PyObject *__pyx_v_r_actual, double __pyx_v_lambda_, double __pyx_v_v_max); /* proto */ +static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObject *__pyx_self, __Pyx_memviewslice __pyx_v_h, __Pyx_memviewslice __pyx_v_Wtv, __Pyx_memviewslice __pyx_v_WtW, __Pyx_memviewslice __pyx_v_permutation, double __pyx_v_kappa); /* proto */ static int __pyx_array___pyx_pf_15View_dot_MemoryView_5array___cinit__(struct __pyx_array_obj *__pyx_v_self, PyObject *__pyx_v_shape, Py_ssize_t __pyx_v_itemsize, PyObject *__pyx_v_format, PyObject *__pyx_v_mode, int __pyx_v_allocate_buffer); /* proto */ static int __pyx_array___pyx_pf_15View_dot_MemoryView_5array_2__getbuffer__(struct __pyx_array_obj *__pyx_v_self, Py_buffer *__pyx_v_info, int __pyx_v_flags); /* proto */ static void 
__pyx_array___pyx_pf_15View_dot_MemoryView_5array_4__dealloc__(struct __pyx_array_obj *__pyx_v_self); /* proto */ @@ -2044,15 +1995,13 @@ static PyObject *__pyx_tuple__17; static PyObject *__pyx_tuple__18; static PyObject *__pyx_tuple__19; static PyObject *__pyx_tuple__21; +static PyObject *__pyx_tuple__22; static PyObject *__pyx_tuple__23; static PyObject *__pyx_tuple__24; static PyObject *__pyx_tuple__25; static PyObject *__pyx_tuple__26; -static PyObject *__pyx_tuple__27; -static PyObject *__pyx_tuple__28; static PyObject *__pyx_codeobj__20; -static PyObject *__pyx_codeobj__22; -static PyObject *__pyx_codeobj__29; +static PyObject *__pyx_codeobj__27; /* Late includes */ /* "gensim/models/nmf_pgd.pyx":12 @@ -2112,7 +2061,7 @@ static double __pyx_f_6gensim_6models_7nmf_pgd_fmax(double __pyx_v_x, double __p * cdef double fmax(double x, double y) nogil: * return x if x > y else y # <<<<<<<<<<<<<< * - * cdef double clip(double a, double a_min, double a_max) nogil: + * def solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa): */ if (((__pyx_v_x > __pyx_v_y) != 0)) { __pyx_t_1 = __pyx_v_x; @@ -2138,82 +2087,33 @@ static double __pyx_f_6gensim_6models_7nmf_pgd_fmax(double __pyx_v_x, double __p /* "gensim/models/nmf_pgd.pyx":18 * return x if x > y else y * - * cdef double clip(double a, double a_min, double a_max) nogil: # <<<<<<<<<<<<<< - * a = fmin(a, a_max) - * a = fmax(a, a_min) - */ - -static double __pyx_f_6gensim_6models_7nmf_pgd_clip(double __pyx_v_a, double __pyx_v_a_min, double __pyx_v_a_max) { - double __pyx_r; - - /* "gensim/models/nmf_pgd.pyx":19 - * - * cdef double clip(double a, double a_min, double a_max) nogil: - * a = fmin(a, a_max) # <<<<<<<<<<<<<< - * a = fmax(a, a_min) - * return a - */ - __pyx_v_a = __pyx_f_6gensim_6models_7nmf_pgd_fmin(__pyx_v_a, __pyx_v_a_max); - - /* "gensim/models/nmf_pgd.pyx":20 - * cdef double clip(double a, double a_min, double a_max) nogil: - * a = fmin(a, a_max) - * a = fmax(a, 
a_min) # <<<<<<<<<<<<<< - * return a - * - */ - __pyx_v_a = __pyx_f_6gensim_6models_7nmf_pgd_fmax(__pyx_v_a, __pyx_v_a_min); - - /* "gensim/models/nmf_pgd.pyx":21 - * a = fmin(a, a_max) - * a = fmax(a, a_min) - * return a # <<<<<<<<<<<<<< - * - * def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, double kappa): - */ - __pyx_r = __pyx_v_a; - goto __pyx_L0; - - /* "gensim/models/nmf_pgd.pyx":18 - * return x if x > y else y - * - * cdef double clip(double a, double a_min, double a_max) nogil: # <<<<<<<<<<<<<< - * a = fmin(a, a_max) - * a = fmax(a, a_min) - */ - - /* function exit code */ - __pyx_L0:; - return __pyx_r; -} - -/* "gensim/models/nmf_pgd.pyx":23 - * return a - * - * def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, double kappa): # <<<<<<<<<<<<<< + * def solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa): # <<<<<<<<<<<<<< * """Find optimal dense vector representation for current W and r matrices. 
* */ /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_7nmf_pgd_1solve_h(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ -static char __pyx_doc_6gensim_6models_7nmf_pgd_solve_h[] = "solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, double kappa)\nFind optimal dense vector representation for current W and r matrices.\n\n Parameters\n ----------\n h : matrix\n Dense representation of documents in current batch.\n Wt_v_minus_r : matrix\n WtW : matrix\n\n Returns\n -------\n float\n Cumulative difference between previous and current h vectors.\n\n "; +static char __pyx_doc_6gensim_6models_7nmf_pgd_solve_h[] = "solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa)\nFind optimal dense vector representation for current W and r matrices.\n\n Parameters\n ----------\n h : matrix\n Dense representation of documents in current batch.\n Wtv : matrix\n WtW : matrix\n\n Returns\n -------\n float\n Cumulative difference between previous and current h vectors.\n\n "; static PyMethodDef __pyx_mdef_6gensim_6models_7nmf_pgd_1solve_h = {"solve_h", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_7nmf_pgd_1solve_h, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_7nmf_pgd_solve_h}; static PyObject *__pyx_pw_6gensim_6models_7nmf_pgd_1solve_h(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { __Pyx_memviewslice __pyx_v_h = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_memviewslice __pyx_v_Wt_v_minus_r = { 0, 0, { 0 }, { 0 }, { 0 } }; + __Pyx_memviewslice __pyx_v_Wtv = { 0, 0, { 0 }, { 0 }, { 0 } }; __Pyx_memviewslice __pyx_v_WtW = { 0, 0, { 0 }, { 0 }, { 0 } }; + __Pyx_memviewslice __pyx_v_permutation = { 0, 0, { 0 }, { 0 }, { 0 } }; double __pyx_v_kappa; PyObject *__pyx_r = 0; __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("solve_h (wrapper)", 0); { - static PyObject **__pyx_pyargnames[] = 
{&__pyx_n_s_h,&__pyx_n_s_Wt_v_minus_r,&__pyx_n_s_WtW,&__pyx_n_s_kappa,0}; - PyObject* values[4] = {0,0,0,0}; + static PyObject **__pyx_pyargnames[] = {&__pyx_n_s_h,&__pyx_n_s_Wtv,&__pyx_n_s_WtW,&__pyx_n_s_permutation,&__pyx_n_s_kappa,0}; + PyObject* values[5] = {0,0,0,0,0}; if (unlikely(__pyx_kwds)) { Py_ssize_t kw_args; const Py_ssize_t pos_args = PyTuple_GET_SIZE(__pyx_args); switch (pos_args) { + case 5: values[4] = PyTuple_GET_ITEM(__pyx_args, 4); + CYTHON_FALLTHROUGH; case 4: values[3] = PyTuple_GET_ITEM(__pyx_args, 3); CYTHON_FALLTHROUGH; case 3: values[2] = PyTuple_GET_ITEM(__pyx_args, 2); @@ -2232,55 +2132,63 @@ static PyObject *__pyx_pw_6gensim_6models_7nmf_pgd_1solve_h(PyObject *__pyx_self else goto __pyx_L5_argtuple_error; CYTHON_FALLTHROUGH; case 1: - if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_Wt_v_minus_r)) != 0)) kw_args--; + if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_Wtv)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("solve_h", 1, 4, 4, 1); __PYX_ERR(0, 23, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("solve_h", 1, 5, 5, 1); __PYX_ERR(0, 18, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 2: if (likely((values[2] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_WtW)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("solve_h", 1, 4, 4, 2); __PYX_ERR(0, 23, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("solve_h", 1, 5, 5, 2); __PYX_ERR(0, 18, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 3: - if (likely((values[3] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_kappa)) != 0)) kw_args--; + if (likely((values[3] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_permutation)) != 0)) kw_args--; + else { + __Pyx_RaiseArgtupleInvalid("solve_h", 1, 5, 5, 3); __PYX_ERR(0, 18, __pyx_L3_error) + } + CYTHON_FALLTHROUGH; + case 4: + if (likely((values[4] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_kappa)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("solve_h", 1, 4, 4, 3); __PYX_ERR(0, 23, 
__pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("solve_h", 1, 5, 5, 4); __PYX_ERR(0, 18, __pyx_L3_error) } } if (unlikely(kw_args > 0)) { - if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "solve_h") < 0)) __PYX_ERR(0, 23, __pyx_L3_error) + if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "solve_h") < 0)) __PYX_ERR(0, 18, __pyx_L3_error) } - } else if (PyTuple_GET_SIZE(__pyx_args) != 4) { + } else if (PyTuple_GET_SIZE(__pyx_args) != 5) { goto __pyx_L5_argtuple_error; } else { values[0] = PyTuple_GET_ITEM(__pyx_args, 0); values[1] = PyTuple_GET_ITEM(__pyx_args, 1); values[2] = PyTuple_GET_ITEM(__pyx_args, 2); values[3] = PyTuple_GET_ITEM(__pyx_args, 3); + values[4] = PyTuple_GET_ITEM(__pyx_args, 4); } - __pyx_v_h = __Pyx_PyObject_to_MemoryviewSlice_d_dc_double(values[0], PyBUF_WRITABLE); if (unlikely(!__pyx_v_h.memview)) __PYX_ERR(0, 23, __pyx_L3_error) - __pyx_v_Wt_v_minus_r = __Pyx_PyObject_to_MemoryviewSlice_dsds_double(values[1], PyBUF_WRITABLE); if (unlikely(!__pyx_v_Wt_v_minus_r.memview)) __PYX_ERR(0, 23, __pyx_L3_error) - __pyx_v_WtW = __Pyx_PyObject_to_MemoryviewSlice_d_dc_double(values[2], PyBUF_WRITABLE); if (unlikely(!__pyx_v_WtW.memview)) __PYX_ERR(0, 23, __pyx_L3_error) - __pyx_v_kappa = __pyx_PyFloat_AsDouble(values[3]); if (unlikely((__pyx_v_kappa == (double)-1) && PyErr_Occurred())) __PYX_ERR(0, 23, __pyx_L3_error) + __pyx_v_h = __Pyx_PyObject_to_MemoryviewSlice_d_dc_double(values[0], PyBUF_WRITABLE); if (unlikely(!__pyx_v_h.memview)) __PYX_ERR(0, 18, __pyx_L3_error) + __pyx_v_Wtv = __Pyx_PyObject_to_MemoryviewSlice_dsds_double(values[1], PyBUF_WRITABLE); if (unlikely(!__pyx_v_Wtv.memview)) __PYX_ERR(0, 18, __pyx_L3_error) + __pyx_v_WtW = __Pyx_PyObject_to_MemoryviewSlice_d_dc_double(values[2], PyBUF_WRITABLE); if (unlikely(!__pyx_v_WtW.memview)) __PYX_ERR(0, 18, __pyx_L3_error) + __pyx_v_permutation = __Pyx_PyObject_to_MemoryviewSlice_dc_int(values[3], 
PyBUF_WRITABLE); if (unlikely(!__pyx_v_permutation.memview)) __PYX_ERR(0, 18, __pyx_L3_error) + __pyx_v_kappa = __pyx_PyFloat_AsDouble(values[4]); if (unlikely((__pyx_v_kappa == (double)-1) && PyErr_Occurred())) __PYX_ERR(0, 18, __pyx_L3_error) } goto __pyx_L4_argument_unpacking_done; __pyx_L5_argtuple_error:; - __Pyx_RaiseArgtupleInvalid("solve_h", 1, 4, 4, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 23, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("solve_h", 1, 5, 5, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 18, __pyx_L3_error) __pyx_L3_error:; __Pyx_AddTraceback("gensim.models.nmf_pgd.solve_h", __pyx_clineno, __pyx_lineno, __pyx_filename); __Pyx_RefNannyFinishContext(); return NULL; __pyx_L4_argument_unpacking_done:; - __pyx_r = __pyx_pf_6gensim_6models_7nmf_pgd_solve_h(__pyx_self, __pyx_v_h, __pyx_v_Wt_v_minus_r, __pyx_v_WtW, __pyx_v_kappa); + __pyx_r = __pyx_pf_6gensim_6models_7nmf_pgd_solve_h(__pyx_self, __pyx_v_h, __pyx_v_Wtv, __pyx_v_WtW, __pyx_v_permutation, __pyx_v_kappa); /* function exit code */ __Pyx_RefNannyFinishContext(); return __pyx_r; } -static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObject *__pyx_self, __Pyx_memviewslice __pyx_v_h, __Pyx_memviewslice __pyx_v_Wt_v_minus_r, __Pyx_memviewslice __pyx_v_WtW, double __pyx_v_kappa) { +static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObject *__pyx_self, __Pyx_memviewslice __pyx_v_h, __Pyx_memviewslice __pyx_v_Wtv, __Pyx_memviewslice __pyx_v_WtW, __Pyx_memviewslice __pyx_v_permutation, double __pyx_v_kappa) { Py_ssize_t __pyx_v_n_components; CYTHON_UNUSED Py_ssize_t __pyx_v_n_samples; double __pyx_v_violation; @@ -2309,17 +2217,18 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec Py_ssize_t __pyx_t_15; Py_ssize_t __pyx_t_16; Py_ssize_t __pyx_t_17; - double __pyx_t_18; - Py_ssize_t __pyx_t_19; + Py_ssize_t __pyx_t_18; + double __pyx_t_19; Py_ssize_t __pyx_t_20; Py_ssize_t __pyx_t_21; Py_ssize_t __pyx_t_22; Py_ssize_t 
__pyx_t_23; Py_ssize_t __pyx_t_24; - PyObject *__pyx_t_25 = NULL; + Py_ssize_t __pyx_t_25; + PyObject *__pyx_t_26 = NULL; __Pyx_RefNannySetupContext("solve_h", 0); - /* "gensim/models/nmf_pgd.pyx":40 + /* "gensim/models/nmf_pgd.pyx":35 * """ * * cdef Py_ssize_t n_components = h.shape[0] # <<<<<<<<<<<<<< @@ -2328,7 +2237,7 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_n_components = (__pyx_v_h.shape[0]); - /* "gensim/models/nmf_pgd.pyx":41 + /* "gensim/models/nmf_pgd.pyx":36 * * cdef Py_ssize_t n_components = h.shape[0] * cdef Py_ssize_t n_samples = h.shape[1] # <<<<<<<<<<<<<< @@ -2337,7 +2246,7 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_n_samples = (__pyx_v_h.shape[1]); - /* "gensim/models/nmf_pgd.pyx":42 + /* "gensim/models/nmf_pgd.pyx":37 * cdef Py_ssize_t n_components = h.shape[0] * cdef Py_ssize_t n_samples = h.shape[1] * cdef double violation = 0 # <<<<<<<<<<<<<< @@ -2346,7 +2255,7 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_violation = 0.0; - /* "gensim/models/nmf_pgd.pyx":44 + /* "gensim/models/nmf_pgd.pyx":39 * cdef double violation = 0 * cdef double grad, projected_grad, hessian * cdef Py_ssize_t sample_idx = 0 # <<<<<<<<<<<<<< @@ -2355,7 +2264,7 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_sample_idx = 0; - /* "gensim/models/nmf_pgd.pyx":45 + /* "gensim/models/nmf_pgd.pyx":40 * cdef double grad, projected_grad, hessian * cdef Py_ssize_t sample_idx = 0 * cdef Py_ssize_t component_idx_1 = 0 # <<<<<<<<<<<<<< @@ -2364,7 +2273,7 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_component_idx_1 = 0; - /* "gensim/models/nmf_pgd.pyx":46 + /* "gensim/models/nmf_pgd.pyx":41 * cdef Py_ssize_t sample_idx = 0 * cdef Py_ssize_t component_idx_1 = 0 * cdef Py_ssize_t component_idx_2 = 0 # <<<<<<<<<<<<<< @@ -2373,12 +2282,12 @@ 
static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_component_idx_2 = 0; - /* "gensim/models/nmf_pgd.pyx":48 + /* "gensim/models/nmf_pgd.pyx":43 * cdef Py_ssize_t component_idx_2 = 0 * * for sample_idx in prange(n_samples, nogil=True): # <<<<<<<<<<<<<< * for component_idx_1 in range(n_components): - * + * component_idx_1 = permutation[component_idx_1] */ { #ifdef WITH_THREAD @@ -2400,7 +2309,7 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec if (__pyx_t_3 > 0) { #ifdef _OPENMP - #pragma omp parallel reduction(+:__pyx_v_violation) private(__pyx_t_10, __pyx_t_11, __pyx_t_12, __pyx_t_13, __pyx_t_14, __pyx_t_15, __pyx_t_16, __pyx_t_17, __pyx_t_18, __pyx_t_19, __pyx_t_20, __pyx_t_21, __pyx_t_22, __pyx_t_23, __pyx_t_24, __pyx_t_4, __pyx_t_5, __pyx_t_6, __pyx_t_7, __pyx_t_8, __pyx_t_9) + #pragma omp parallel reduction(+:__pyx_v_violation) private(__pyx_t_10, __pyx_t_11, __pyx_t_12, __pyx_t_13, __pyx_t_14, __pyx_t_15, __pyx_t_16, __pyx_t_17, __pyx_t_18, __pyx_t_19, __pyx_t_20, __pyx_t_21, __pyx_t_22, __pyx_t_23, __pyx_t_24, __pyx_t_25, __pyx_t_4, __pyx_t_5, __pyx_t_6, __pyx_t_7, __pyx_t_8, __pyx_t_9) #endif /* _OPENMP */ { #ifdef _OPENMP @@ -2416,67 +2325,77 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec __pyx_v_hessian = ((double)__PYX_NAN()); __pyx_v_projected_grad = ((double)__PYX_NAN()); - /* "gensim/models/nmf_pgd.pyx":49 + /* "gensim/models/nmf_pgd.pyx":44 * * for sample_idx in prange(n_samples, nogil=True): * for component_idx_1 in range(n_components): # <<<<<<<<<<<<<< + * component_idx_1 = permutation[component_idx_1] * - * grad = -Wt_v_minus_r[component_idx_1, sample_idx] */ __pyx_t_4 = __pyx_v_n_components; __pyx_t_5 = __pyx_t_4; for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_component_idx_1 = __pyx_t_6; - /* "gensim/models/nmf_pgd.pyx":51 + /* "gensim/models/nmf_pgd.pyx":45 + * for sample_idx in prange(n_samples, nogil=True): * for 
component_idx_1 in range(n_components): + * component_idx_1 = permutation[component_idx_1] # <<<<<<<<<<<<<< + * + * grad = -Wtv[component_idx_1, sample_idx] + */ + __pyx_t_7 = __pyx_v_component_idx_1; + __pyx_v_component_idx_1 = (*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_permutation.data) + __pyx_t_7)) ))); + + /* "gensim/models/nmf_pgd.pyx":47 + * component_idx_1 = permutation[component_idx_1] * - * grad = -Wt_v_minus_r[component_idx_1, sample_idx] # <<<<<<<<<<<<<< + * grad = -Wtv[component_idx_1, sample_idx] # <<<<<<<<<<<<<< * * for component_idx_2 in range(n_components): */ - __pyx_t_7 = __pyx_v_component_idx_1; - __pyx_t_8 = __pyx_v_sample_idx; - __pyx_v_grad = (-(*((double *) ( /* dim=1 */ (( /* dim=0 */ (__pyx_v_Wt_v_minus_r.data + __pyx_t_7 * __pyx_v_Wt_v_minus_r.strides[0]) ) + __pyx_t_8 * __pyx_v_Wt_v_minus_r.strides[1]) )))); + __pyx_t_8 = __pyx_v_component_idx_1; + __pyx_t_9 = __pyx_v_sample_idx; + __pyx_v_grad = (-(*((double *) ( /* dim=1 */ (( /* dim=0 */ (__pyx_v_Wtv.data + __pyx_t_8 * __pyx_v_Wtv.strides[0]) ) + __pyx_t_9 * __pyx_v_Wtv.strides[1]) )))); - /* "gensim/models/nmf_pgd.pyx":53 - * grad = -Wt_v_minus_r[component_idx_1, sample_idx] + /* "gensim/models/nmf_pgd.pyx":49 + * grad = -Wtv[component_idx_1, sample_idx] * * for component_idx_2 in range(n_components): # <<<<<<<<<<<<<< * grad += WtW[component_idx_1, component_idx_2] * h[component_idx_2, sample_idx] * */ - __pyx_t_9 = __pyx_v_n_components; - __pyx_t_10 = __pyx_t_9; - for (__pyx_t_11 = 0; __pyx_t_11 < __pyx_t_10; __pyx_t_11+=1) { - __pyx_v_component_idx_2 = __pyx_t_11; + __pyx_t_10 = __pyx_v_n_components; + __pyx_t_11 = __pyx_t_10; + for (__pyx_t_12 = 0; __pyx_t_12 < __pyx_t_11; __pyx_t_12+=1) { + __pyx_v_component_idx_2 = __pyx_t_12; - /* "gensim/models/nmf_pgd.pyx":54 + /* "gensim/models/nmf_pgd.pyx":50 * * for component_idx_2 in range(n_components): * grad += WtW[component_idx_1, component_idx_2] * h[component_idx_2, sample_idx] # <<<<<<<<<<<<<< * * hessian = 
WtW[component_idx_1, component_idx_1] */ - __pyx_t_12 = __pyx_v_component_idx_1; - __pyx_t_13 = __pyx_v_component_idx_2; + __pyx_t_13 = __pyx_v_component_idx_1; __pyx_t_14 = __pyx_v_component_idx_2; - __pyx_t_15 = __pyx_v_sample_idx; - __pyx_v_grad = (__pyx_v_grad + ((*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_WtW.data + __pyx_t_12 * __pyx_v_WtW.strides[0]) )) + __pyx_t_13)) ))) * (*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_14 * __pyx_v_h.strides[0]) )) + __pyx_t_15)) ))))); + __pyx_t_15 = __pyx_v_component_idx_2; + __pyx_t_16 = __pyx_v_sample_idx; + __pyx_v_grad = (__pyx_v_grad + ((*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_WtW.data + __pyx_t_13 * __pyx_v_WtW.strides[0]) )) + __pyx_t_14)) ))) * (*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_15 * __pyx_v_h.strides[0]) )) + __pyx_t_16)) ))))); } - /* "gensim/models/nmf_pgd.pyx":56 + /* "gensim/models/nmf_pgd.pyx":52 * grad += WtW[component_idx_1, component_idx_2] * h[component_idx_2, sample_idx] * * hessian = WtW[component_idx_1, component_idx_1] # <<<<<<<<<<<<<< * * grad = grad * kappa / hessian */ - __pyx_t_16 = __pyx_v_component_idx_1; __pyx_t_17 = __pyx_v_component_idx_1; - __pyx_v_hessian = (*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_WtW.data + __pyx_t_16 * __pyx_v_WtW.strides[0]) )) + __pyx_t_17)) ))); + __pyx_t_18 = __pyx_v_component_idx_1; + __pyx_v_hessian = (*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_WtW.data + __pyx_t_17 * __pyx_v_WtW.strides[0]) )) + __pyx_t_18)) ))); - /* "gensim/models/nmf_pgd.pyx":58 + /* "gensim/models/nmf_pgd.pyx":54 * hessian = WtW[component_idx_1, component_idx_1] * * grad = grad * kappa / hessian # <<<<<<<<<<<<<< @@ -2485,23 +2404,23 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_grad = ((__pyx_v_grad * __pyx_v_kappa) / 
__pyx_v_hessian); - /* "gensim/models/nmf_pgd.pyx":60 + /* "gensim/models/nmf_pgd.pyx":56 * grad = grad * kappa / hessian * * projected_grad = fmin(0, grad) if h[component_idx_1, sample_idx] == 0 else grad # <<<<<<<<<<<<<< * * violation += projected_grad * projected_grad */ - __pyx_t_19 = __pyx_v_component_idx_1; - __pyx_t_20 = __pyx_v_sample_idx; - if ((((*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_19 * __pyx_v_h.strides[0]) )) + __pyx_t_20)) ))) == 0.0) != 0)) { - __pyx_t_18 = __pyx_f_6gensim_6models_7nmf_pgd_fmin(0.0, __pyx_v_grad); + __pyx_t_20 = __pyx_v_component_idx_1; + __pyx_t_21 = __pyx_v_sample_idx; + if ((((*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_20 * __pyx_v_h.strides[0]) )) + __pyx_t_21)) ))) == 0.0) != 0)) { + __pyx_t_19 = __pyx_f_6gensim_6models_7nmf_pgd_fmin(0.0, __pyx_v_grad); } else { - __pyx_t_18 = __pyx_v_grad; + __pyx_t_19 = __pyx_v_grad; } - __pyx_v_projected_grad = __pyx_t_18; + __pyx_v_projected_grad = __pyx_t_19; - /* "gensim/models/nmf_pgd.pyx":62 + /* "gensim/models/nmf_pgd.pyx":58 * projected_grad = fmin(0, grad) if h[component_idx_1, sample_idx] == 0 else grad * * violation += projected_grad * projected_grad # <<<<<<<<<<<<<< @@ -2510,18 +2429,18 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec */ __pyx_v_violation = (__pyx_v_violation + (__pyx_v_projected_grad * __pyx_v_projected_grad)); - /* "gensim/models/nmf_pgd.pyx":64 + /* "gensim/models/nmf_pgd.pyx":60 * violation += projected_grad * projected_grad * * h[component_idx_1, sample_idx] = fmax(h[component_idx_1, sample_idx] - grad, 0.) 
# <<<<<<<<<<<<<< * * return sqrt(violation) */ - __pyx_t_21 = __pyx_v_component_idx_1; - __pyx_t_22 = __pyx_v_sample_idx; - __pyx_t_23 = __pyx_v_component_idx_1; - __pyx_t_24 = __pyx_v_sample_idx; - *((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_23 * __pyx_v_h.strides[0]) )) + __pyx_t_24)) )) = __pyx_f_6gensim_6models_7nmf_pgd_fmax(((*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_21 * __pyx_v_h.strides[0]) )) + __pyx_t_22)) ))) - __pyx_v_grad), 0.); + __pyx_t_22 = __pyx_v_component_idx_1; + __pyx_t_23 = __pyx_v_sample_idx; + __pyx_t_24 = __pyx_v_component_idx_1; + __pyx_t_25 = __pyx_v_sample_idx; + *((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_24 * __pyx_v_h.strides[0]) )) + __pyx_t_25)) )) = __pyx_f_6gensim_6models_7nmf_pgd_fmax(((*((double *) ( /* dim=1 */ ((char *) (((double *) ( /* dim=0 */ (__pyx_v_h.data + __pyx_t_22 * __pyx_v_h.strides[0]) )) + __pyx_t_23)) ))) - __pyx_v_grad), 0.); } } } @@ -2536,12 +2455,12 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec #endif } - /* "gensim/models/nmf_pgd.pyx":48 + /* "gensim/models/nmf_pgd.pyx":43 * cdef Py_ssize_t component_idx_2 = 0 * * for sample_idx in prange(n_samples, nogil=True): # <<<<<<<<<<<<<< * for component_idx_1 in range(n_components): - * + * component_idx_1 = permutation[component_idx_1] */ /*finally:*/ { /*normal exit:*/{ @@ -2555,780 +2474,36 @@ static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_solve_h(CYTHON_UNUSED PyObjec } } - /* "gensim/models/nmf_pgd.pyx":66 + /* "gensim/models/nmf_pgd.pyx":62 * h[component_idx_1, sample_idx] = fmax(h[component_idx_1, sample_idx] - grad, 0.) 
* * return sqrt(violation) # <<<<<<<<<<<<<< - * - * def solve_r( */ __Pyx_XDECREF(__pyx_r); - __pyx_t_25 = PyFloat_FromDouble(sqrt(__pyx_v_violation)); if (unlikely(!__pyx_t_25)) __PYX_ERR(0, 66, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_25); - __pyx_r = __pyx_t_25; - __pyx_t_25 = 0; + __pyx_t_26 = PyFloat_FromDouble(sqrt(__pyx_v_violation)); if (unlikely(!__pyx_t_26)) __PYX_ERR(0, 62, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_26); + __pyx_r = __pyx_t_26; + __pyx_t_26 = 0; goto __pyx_L0; - /* "gensim/models/nmf_pgd.pyx":23 - * return a + /* "gensim/models/nmf_pgd.pyx":18 + * return x if x > y else y * - * def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, double kappa): # <<<<<<<<<<<<<< + * def solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa): # <<<<<<<<<<<<<< * """Find optimal dense vector representation for current W and r matrices. * */ /* function exit code */ __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_25); + __Pyx_XDECREF(__pyx_t_26); __Pyx_AddTraceback("gensim.models.nmf_pgd.solve_h", __pyx_clineno, __pyx_lineno, __pyx_filename); __pyx_r = NULL; __pyx_L0:; __PYX_XDEC_MEMVIEW(&__pyx_v_h, 1); - __PYX_XDEC_MEMVIEW(&__pyx_v_Wt_v_minus_r, 1); + __PYX_XDEC_MEMVIEW(&__pyx_v_Wtv, 1); __PYX_XDEC_MEMVIEW(&__pyx_v_WtW, 1); - __Pyx_XGIVEREF(__pyx_r); - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -/* "gensim/models/nmf_pgd.pyx":68 - * return sqrt(violation) - * - * def solve_r( # <<<<<<<<<<<<<< - * r, - * r_actual, - */ - -/* Python wrapper */ -static PyObject *__pyx_pw_6gensim_6models_7nmf_pgd_3solve_r(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ -static char __pyx_doc_6gensim_6models_7nmf_pgd_2solve_r[] = "solve_r(r, r_actual, double lambda_, double v_max)\nBound new residuals.\n\n Parameters\n ----------\n r: sparse matrix\n r_actual: sparse matrix\n lambda_ : double\n v_max : double\n\n Returns\n -------\n float\n Cumulative difference between previous and 
current residuals vectors.\n\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_7nmf_pgd_3solve_r = {"solve_r", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_7nmf_pgd_3solve_r, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_7nmf_pgd_2solve_r}; -static PyObject *__pyx_pw_6gensim_6models_7nmf_pgd_3solve_r(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { - PyObject *__pyx_v_r = 0; - PyObject *__pyx_v_r_actual = 0; - double __pyx_v_lambda_; - double __pyx_v_v_max; - PyObject *__pyx_r = 0; - __Pyx_RefNannyDeclarations - __Pyx_RefNannySetupContext("solve_r (wrapper)", 0); - { - static PyObject **__pyx_pyargnames[] = {&__pyx_n_s_r,&__pyx_n_s_r_actual,&__pyx_n_s_lambda,&__pyx_n_s_v_max,0}; - PyObject* values[4] = {0,0,0,0}; - if (unlikely(__pyx_kwds)) { - Py_ssize_t kw_args; - const Py_ssize_t pos_args = PyTuple_GET_SIZE(__pyx_args); - switch (pos_args) { - case 4: values[3] = PyTuple_GET_ITEM(__pyx_args, 3); - CYTHON_FALLTHROUGH; - case 3: values[2] = PyTuple_GET_ITEM(__pyx_args, 2); - CYTHON_FALLTHROUGH; - case 2: values[1] = PyTuple_GET_ITEM(__pyx_args, 1); - CYTHON_FALLTHROUGH; - case 1: values[0] = PyTuple_GET_ITEM(__pyx_args, 0); - CYTHON_FALLTHROUGH; - case 0: break; - default: goto __pyx_L5_argtuple_error; - } - kw_args = PyDict_Size(__pyx_kwds); - switch (pos_args) { - case 0: - if (likely((values[0] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_r)) != 0)) kw_args--; - else goto __pyx_L5_argtuple_error; - CYTHON_FALLTHROUGH; - case 1: - if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_r_actual)) != 0)) kw_args--; - else { - __Pyx_RaiseArgtupleInvalid("solve_r", 1, 4, 4, 1); __PYX_ERR(0, 68, __pyx_L3_error) - } - CYTHON_FALLTHROUGH; - case 2: - if (likely((values[2] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_lambda)) != 0)) kw_args--; - else { - __Pyx_RaiseArgtupleInvalid("solve_r", 1, 4, 4, 2); __PYX_ERR(0, 68, __pyx_L3_error) - } - CYTHON_FALLTHROUGH; - case 3: - if (likely((values[3] 
= __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_v_max)) != 0)) kw_args--; - else { - __Pyx_RaiseArgtupleInvalid("solve_r", 1, 4, 4, 3); __PYX_ERR(0, 68, __pyx_L3_error) - } - } - if (unlikely(kw_args > 0)) { - if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "solve_r") < 0)) __PYX_ERR(0, 68, __pyx_L3_error) - } - } else if (PyTuple_GET_SIZE(__pyx_args) != 4) { - goto __pyx_L5_argtuple_error; - } else { - values[0] = PyTuple_GET_ITEM(__pyx_args, 0); - values[1] = PyTuple_GET_ITEM(__pyx_args, 1); - values[2] = PyTuple_GET_ITEM(__pyx_args, 2); - values[3] = PyTuple_GET_ITEM(__pyx_args, 3); - } - __pyx_v_r = values[0]; - __pyx_v_r_actual = values[1]; - __pyx_v_lambda_ = __pyx_PyFloat_AsDouble(values[2]); if (unlikely((__pyx_v_lambda_ == (double)-1) && PyErr_Occurred())) __PYX_ERR(0, 71, __pyx_L3_error) - __pyx_v_v_max = __pyx_PyFloat_AsDouble(values[3]); if (unlikely((__pyx_v_v_max == (double)-1) && PyErr_Occurred())) __PYX_ERR(0, 72, __pyx_L3_error) - } - goto __pyx_L4_argument_unpacking_done; - __pyx_L5_argtuple_error:; - __Pyx_RaiseArgtupleInvalid("solve_r", 1, 4, 4, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 68, __pyx_L3_error) - __pyx_L3_error:; - __Pyx_AddTraceback("gensim.models.nmf_pgd.solve_r", __pyx_clineno, __pyx_lineno, __pyx_filename); - __Pyx_RefNannyFinishContext(); - return NULL; - __pyx_L4_argument_unpacking_done:; - __pyx_r = __pyx_pf_6gensim_6models_7nmf_pgd_2solve_r(__pyx_self, __pyx_v_r, __pyx_v_r_actual, __pyx_v_lambda_, __pyx_v_v_max); - - /* function exit code */ - __Pyx_RefNannyFinishContext(); - return __pyx_r; -} - -static PyObject *__pyx_pf_6gensim_6models_7nmf_pgd_2solve_r(CYTHON_UNUSED PyObject *__pyx_self, PyObject *__pyx_v_r, PyObject *__pyx_v_r_actual, double __pyx_v_lambda_, double __pyx_v_v_max) { - __Pyx_memviewslice __pyx_v_r_indptr = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_memviewslice __pyx_v_r_indices = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_memviewslice __pyx_v_r_data = { 0, 0, { 0 }, { 
0 }, { 0 } }; - __Pyx_memviewslice __pyx_v_r_actual_indptr = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_memviewslice __pyx_v_r_actual_indices = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_memviewslice __pyx_v_r_actual_data = { 0, 0, { 0 }, { 0 }, { 0 } }; - Py_ssize_t __pyx_v_r_col_size; - Py_ssize_t __pyx_v_r_actual_col_size; - Py_ssize_t __pyx_v_r_col_indptr; - Py_ssize_t __pyx_v_r_actual_col_indptr; - Py_ssize_t __pyx_v_r_col_idx; - Py_ssize_t __pyx_v_r_actual_col_idx; - double *__pyx_v_r_element; - double *__pyx_v_r_actual_element; - double __pyx_v_r_actual_sign; - CYTHON_UNUSED Py_ssize_t __pyx_v_n_samples; - Py_ssize_t __pyx_v_sample_idx; - double __pyx_v_violation; - PyObject *__pyx_r = NULL; - __Pyx_RefNannyDeclarations - PyObject *__pyx_t_1 = NULL; - __Pyx_memviewslice __pyx_t_2 = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_memviewslice __pyx_t_3 = { 0, 0, { 0 }, { 0 }, { 0 } }; - Py_ssize_t __pyx_t_4; - Py_ssize_t __pyx_t_5; - Py_ssize_t __pyx_t_6; - Py_ssize_t __pyx_t_7; - Py_ssize_t __pyx_t_8; - Py_ssize_t __pyx_t_9; - Py_ssize_t __pyx_t_10; - int __pyx_t_11; - int __pyx_t_12; - Py_ssize_t __pyx_t_13; - Py_ssize_t __pyx_t_14; - Py_ssize_t __pyx_t_15; - Py_ssize_t __pyx_t_16; - Py_ssize_t __pyx_t_17; - Py_ssize_t __pyx_t_18; - Py_ssize_t __pyx_t_19; - Py_ssize_t __pyx_t_20; - __Pyx_RefNannySetupContext("solve_r", 0); - - /* "gensim/models/nmf_pgd.pyx":90 - * """ - * - * cdef int[::1] r_indptr = r.indptr # <<<<<<<<<<<<<< - * cdef int[::1] r_indices = r.indices - * cdef double[::1] r_data = r.data - */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_r, __pyx_n_s_indptr); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 90, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyObject_to_MemoryviewSlice_dc_int(__pyx_t_1, PyBUF_WRITABLE); if (unlikely(!__pyx_t_2.memview)) __PYX_ERR(0, 90, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_r_indptr = __pyx_t_2; - __pyx_t_2.memview = NULL; - __pyx_t_2.data = NULL; - - /* "gensim/models/nmf_pgd.pyx":91 - * - 
* cdef int[::1] r_indptr = r.indptr - * cdef int[::1] r_indices = r.indices # <<<<<<<<<<<<<< - * cdef double[::1] r_data = r.data - * cdef int[::1] r_actual_indptr = r_actual.indptr - */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_r, __pyx_n_s_indices); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 91, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyObject_to_MemoryviewSlice_dc_int(__pyx_t_1, PyBUF_WRITABLE); if (unlikely(!__pyx_t_2.memview)) __PYX_ERR(0, 91, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_r_indices = __pyx_t_2; - __pyx_t_2.memview = NULL; - __pyx_t_2.data = NULL; - - /* "gensim/models/nmf_pgd.pyx":92 - * cdef int[::1] r_indptr = r.indptr - * cdef int[::1] r_indices = r.indices - * cdef double[::1] r_data = r.data # <<<<<<<<<<<<<< - * cdef int[::1] r_actual_indptr = r_actual.indptr - * cdef int[::1] r_actual_indices = r_actual.indices - */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_r, __pyx_n_s_data); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 92, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyObject_to_MemoryviewSlice_dc_double(__pyx_t_1, PyBUF_WRITABLE); if (unlikely(!__pyx_t_3.memview)) __PYX_ERR(0, 92, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_r_data = __pyx_t_3; - __pyx_t_3.memview = NULL; - __pyx_t_3.data = NULL; - - /* "gensim/models/nmf_pgd.pyx":93 - * cdef int[::1] r_indices = r.indices - * cdef double[::1] r_data = r.data - * cdef int[::1] r_actual_indptr = r_actual.indptr # <<<<<<<<<<<<<< - * cdef int[::1] r_actual_indices = r_actual.indices - * cdef double[::1] r_actual_data = r_actual.data - */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_r_actual, __pyx_n_s_indptr); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 93, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyObject_to_MemoryviewSlice_dc_int(__pyx_t_1, PyBUF_WRITABLE); if (unlikely(!__pyx_t_2.memview)) __PYX_ERR(0, 93, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - 
__pyx_v_r_actual_indptr = __pyx_t_2; - __pyx_t_2.memview = NULL; - __pyx_t_2.data = NULL; - - /* "gensim/models/nmf_pgd.pyx":94 - * cdef double[::1] r_data = r.data - * cdef int[::1] r_actual_indptr = r_actual.indptr - * cdef int[::1] r_actual_indices = r_actual.indices # <<<<<<<<<<<<<< - * cdef double[::1] r_actual_data = r_actual.data - * - */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_r_actual, __pyx_n_s_indices); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 94, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyObject_to_MemoryviewSlice_dc_int(__pyx_t_1, PyBUF_WRITABLE); if (unlikely(!__pyx_t_2.memview)) __PYX_ERR(0, 94, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_r_actual_indices = __pyx_t_2; - __pyx_t_2.memview = NULL; - __pyx_t_2.data = NULL; - - /* "gensim/models/nmf_pgd.pyx":95 - * cdef int[::1] r_actual_indptr = r_actual.indptr - * cdef int[::1] r_actual_indices = r_actual.indices - * cdef double[::1] r_actual_data = r_actual.data # <<<<<<<<<<<<<< - * - * cdef Py_ssize_t r_col_size = 0 - */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_r_actual, __pyx_n_s_data); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 95, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyObject_to_MemoryviewSlice_dc_double(__pyx_t_1, PyBUF_WRITABLE); if (unlikely(!__pyx_t_3.memview)) __PYX_ERR(0, 95, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_v_r_actual_data = __pyx_t_3; - __pyx_t_3.memview = NULL; - __pyx_t_3.data = NULL; - - /* "gensim/models/nmf_pgd.pyx":97 - * cdef double[::1] r_actual_data = r_actual.data - * - * cdef Py_ssize_t r_col_size = 0 # <<<<<<<<<<<<<< - * cdef Py_ssize_t r_actual_col_size = 0 - * cdef Py_ssize_t r_col_indptr - */ - __pyx_v_r_col_size = 0; - - /* "gensim/models/nmf_pgd.pyx":98 - * - * cdef Py_ssize_t r_col_size = 0 - * cdef Py_ssize_t r_actual_col_size = 0 # <<<<<<<<<<<<<< - * cdef Py_ssize_t r_col_indptr - * cdef Py_ssize_t r_actual_col_indptr - */ - __pyx_v_r_actual_col_size = 0; - 
- /* "gensim/models/nmf_pgd.pyx":106 - * cdef double* r_actual_element - * - * cdef double r_actual_sign = 1.0 # <<<<<<<<<<<<<< - * - * cdef Py_ssize_t n_samples = r_actual_indptr.shape[0] - 1 - */ - __pyx_v_r_actual_sign = 1.0; - - /* "gensim/models/nmf_pgd.pyx":108 - * cdef double r_actual_sign = 1.0 - * - * cdef Py_ssize_t n_samples = r_actual_indptr.shape[0] - 1 # <<<<<<<<<<<<<< - * cdef Py_ssize_t sample_idx - * - */ - __pyx_v_n_samples = ((__pyx_v_r_actual_indptr.shape[0]) - 1); - - /* "gensim/models/nmf_pgd.pyx":111 - * cdef Py_ssize_t sample_idx - * - * cdef double violation = 0 # <<<<<<<<<<<<<< - * - * for sample_idx in prange(n_samples, nogil=True): - */ - __pyx_v_violation = 0.0; - - /* "gensim/models/nmf_pgd.pyx":113 - * cdef double violation = 0 - * - * for sample_idx in prange(n_samples, nogil=True): # <<<<<<<<<<<<<< - * r_col_size = r_indptr[sample_idx + 1] - r_indptr[sample_idx] - * r_actual_col_size = r_actual_indptr[sample_idx + 1] - r_actual_indptr[sample_idx] - */ - { - #ifdef WITH_THREAD - PyThreadState *_save; - Py_UNBLOCK_THREADS - __Pyx_FastGIL_Remember(); - #endif - /*try:*/ { - __pyx_t_4 = __pyx_v_n_samples; - if (1 == 0) abort(); - { - #if ((defined(__APPLE__) || defined(__OSX__)) && (defined(__GNUC__) && (__GNUC__ > 2 || (__GNUC__ == 2 && (__GNUC_MINOR__ > 95))))) - #undef likely - #undef unlikely - #define likely(x) (x) - #define unlikely(x) (x) - #endif - __pyx_t_6 = (__pyx_t_4 - 0 + 1 - 1/abs(1)) / 1; - if (__pyx_t_6 > 0) - { - #ifdef _OPENMP - #pragma omp parallel reduction(+:__pyx_v_violation) private(__pyx_t_10, __pyx_t_11, __pyx_t_12, __pyx_t_13, __pyx_t_14, __pyx_t_15, __pyx_t_16, __pyx_t_17, __pyx_t_18, __pyx_t_19, __pyx_t_20, __pyx_t_7, __pyx_t_8, __pyx_t_9) - #endif /* _OPENMP */ - { - #ifdef _OPENMP - #pragma omp for lastprivate(__pyx_v_r_actual_col_idx) lastprivate(__pyx_v_r_actual_col_indptr) lastprivate(__pyx_v_r_actual_col_size) lastprivate(__pyx_v_r_actual_element) lastprivate(__pyx_v_r_actual_sign) 
lastprivate(__pyx_v_r_col_idx) lastprivate(__pyx_v_r_col_indptr) lastprivate(__pyx_v_r_col_size) lastprivate(__pyx_v_r_element) firstprivate(__pyx_v_sample_idx) lastprivate(__pyx_v_sample_idx) - #endif /* _OPENMP */ - for (__pyx_t_5 = 0; __pyx_t_5 < __pyx_t_6; __pyx_t_5++){ - { - __pyx_v_sample_idx = (Py_ssize_t)(0 + 1 * __pyx_t_5); - /* Initialize private variables to invalid values */ - __pyx_v_r_actual_col_idx = ((Py_ssize_t)0xbad0bad0); - __pyx_v_r_actual_col_indptr = ((Py_ssize_t)0xbad0bad0); - __pyx_v_r_actual_col_size = ((Py_ssize_t)0xbad0bad0); - __pyx_v_r_actual_element = ((double *)1); - __pyx_v_r_actual_sign = ((double)__PYX_NAN()); - __pyx_v_r_col_idx = ((Py_ssize_t)0xbad0bad0); - __pyx_v_r_col_indptr = ((Py_ssize_t)0xbad0bad0); - __pyx_v_r_col_size = ((Py_ssize_t)0xbad0bad0); - __pyx_v_r_element = ((double *)1); - - /* "gensim/models/nmf_pgd.pyx":114 - * - * for sample_idx in prange(n_samples, nogil=True): - * r_col_size = r_indptr[sample_idx + 1] - r_indptr[sample_idx] # <<<<<<<<<<<<<< - * r_actual_col_size = r_actual_indptr[sample_idx + 1] - r_actual_indptr[sample_idx] - * - */ - __pyx_t_7 = (__pyx_v_sample_idx + 1); - __pyx_t_8 = __pyx_v_sample_idx; - __pyx_v_r_col_size = ((*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_indptr.data) + __pyx_t_7)) ))) - (*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_indptr.data) + __pyx_t_8)) )))); - - /* "gensim/models/nmf_pgd.pyx":115 - * for sample_idx in prange(n_samples, nogil=True): - * r_col_size = r_indptr[sample_idx + 1] - r_indptr[sample_idx] - * r_actual_col_size = r_actual_indptr[sample_idx + 1] - r_actual_indptr[sample_idx] # <<<<<<<<<<<<<< - * - * r_col_idx = 0 - */ - __pyx_t_9 = (__pyx_v_sample_idx + 1); - __pyx_t_10 = __pyx_v_sample_idx; - __pyx_v_r_actual_col_size = ((*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_actual_indptr.data) + __pyx_t_9)) ))) - (*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_actual_indptr.data) + __pyx_t_10)) )))); - - /* 
"gensim/models/nmf_pgd.pyx":117 - * r_actual_col_size = r_actual_indptr[sample_idx + 1] - r_actual_indptr[sample_idx] - * - * r_col_idx = 0 # <<<<<<<<<<<<<< - * r_actual_col_idx = 0 - * - */ - __pyx_v_r_col_idx = 0; - - /* "gensim/models/nmf_pgd.pyx":118 - * - * r_col_idx = 0 - * r_actual_col_idx = 0 # <<<<<<<<<<<<<< - * - * while r_col_idx < r_col_size or r_actual_col_idx < r_actual_col_size: - */ - __pyx_v_r_actual_col_idx = 0; - - /* "gensim/models/nmf_pgd.pyx":120 - * r_actual_col_idx = 0 - * - * while r_col_idx < r_col_size or r_actual_col_idx < r_actual_col_size: # <<<<<<<<<<<<<< - * r_col_indptr = r_indices[ - * r_indptr[sample_idx] - */ - while (1) { - __pyx_t_12 = ((__pyx_v_r_col_idx < __pyx_v_r_col_size) != 0); - if (!__pyx_t_12) { - } else { - __pyx_t_11 = __pyx_t_12; - goto __pyx_L12_bool_binop_done; - } - __pyx_t_12 = ((__pyx_v_r_actual_col_idx < __pyx_v_r_actual_col_size) != 0); - __pyx_t_11 = __pyx_t_12; - __pyx_L12_bool_binop_done:; - if (!__pyx_t_11) break; - - /* "gensim/models/nmf_pgd.pyx":122 - * while r_col_idx < r_col_size or r_actual_col_idx < r_actual_col_size: - * r_col_indptr = r_indices[ - * r_indptr[sample_idx] # <<<<<<<<<<<<<< - * + r_col_idx - * ] - */ - __pyx_t_13 = __pyx_v_sample_idx; - - /* "gensim/models/nmf_pgd.pyx":121 - * - * while r_col_idx < r_col_size or r_actual_col_idx < r_actual_col_size: - * r_col_indptr = r_indices[ # <<<<<<<<<<<<<< - * r_indptr[sample_idx] - * + r_col_idx - */ - __pyx_t_14 = ((*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_indptr.data) + __pyx_t_13)) ))) + __pyx_v_r_col_idx); - __pyx_v_r_col_indptr = (*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_indices.data) + __pyx_t_14)) ))); - - /* "gensim/models/nmf_pgd.pyx":126 - * ] - * r_actual_col_indptr = r_actual_indices[ - * r_actual_indptr[sample_idx] # <<<<<<<<<<<<<< - * + r_actual_col_idx - * ] - */ - __pyx_t_15 = __pyx_v_sample_idx; - - /* "gensim/models/nmf_pgd.pyx":125 - * + r_col_idx - * ] - * r_actual_col_indptr = r_actual_indices[ # 
<<<<<<<<<<<<<< - * r_actual_indptr[sample_idx] - * + r_actual_col_idx - */ - __pyx_t_16 = ((*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_actual_indptr.data) + __pyx_t_15)) ))) + __pyx_v_r_actual_col_idx); - __pyx_v_r_actual_col_indptr = (*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_actual_indices.data) + __pyx_t_16)) ))); - - /* "gensim/models/nmf_pgd.pyx":131 - * - * r_element = &r_data[ - * r_indptr[sample_idx] # <<<<<<<<<<<<<< - * + r_col_idx - * ] - */ - __pyx_t_17 = __pyx_v_sample_idx; - - /* "gensim/models/nmf_pgd.pyx":130 - * ] - * - * r_element = &r_data[ # <<<<<<<<<<<<<< - * r_indptr[sample_idx] - * + r_col_idx - */ - __pyx_t_18 = ((*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_indptr.data) + __pyx_t_17)) ))) + __pyx_v_r_col_idx); - __pyx_v_r_element = (&(*((double *) ( /* dim=0 */ ((char *) (((double *) __pyx_v_r_data.data) + __pyx_t_18)) )))); - - /* "gensim/models/nmf_pgd.pyx":135 - * ] - * r_actual_element = &r_actual_data[ - * r_actual_indptr[sample_idx] # <<<<<<<<<<<<<< - * + r_actual_col_idx - * ] - */ - __pyx_t_19 = __pyx_v_sample_idx; - - /* "gensim/models/nmf_pgd.pyx":134 - * + r_col_idx - * ] - * r_actual_element = &r_actual_data[ # <<<<<<<<<<<<<< - * r_actual_indptr[sample_idx] - * + r_actual_col_idx - */ - __pyx_t_20 = ((*((int *) ( /* dim=0 */ ((char *) (((int *) __pyx_v_r_actual_indptr.data) + __pyx_t_19)) ))) + __pyx_v_r_actual_col_idx); - __pyx_v_r_actual_element = (&(*((double *) ( /* dim=0 */ ((char *) (((double *) __pyx_v_r_actual_data.data) + __pyx_t_20)) )))); - - /* "gensim/models/nmf_pgd.pyx":139 - * ] - * - * if r_col_indptr >= r_actual_col_indptr: # <<<<<<<<<<<<<< - * r_actual_sign = copysign(r_actual_sign, r_actual_element[0]) - * - */ - __pyx_t_11 = ((__pyx_v_r_col_indptr >= __pyx_v_r_actual_col_indptr) != 0); - if (__pyx_t_11) { - - /* "gensim/models/nmf_pgd.pyx":140 - * - * if r_col_indptr >= r_actual_col_indptr: - * r_actual_sign = copysign(r_actual_sign, r_actual_element[0]) # <<<<<<<<<<<<<< - * - * 
r_actual_element[0] = fabs(r_actual_element[0]) - lambda_ - */ - __pyx_v_r_actual_sign = copysign(__pyx_v_r_actual_sign, (__pyx_v_r_actual_element[0])); - - /* "gensim/models/nmf_pgd.pyx":142 - * r_actual_sign = copysign(r_actual_sign, r_actual_element[0]) - * - * r_actual_element[0] = fabs(r_actual_element[0]) - lambda_ # <<<<<<<<<<<<<< - * r_actual_element[0] = fmax(r_actual_element[0], 0) - * - */ - (__pyx_v_r_actual_element[0]) = (fabs((__pyx_v_r_actual_element[0])) - __pyx_v_lambda_); - - /* "gensim/models/nmf_pgd.pyx":143 - * - * r_actual_element[0] = fabs(r_actual_element[0]) - lambda_ - * r_actual_element[0] = fmax(r_actual_element[0], 0) # <<<<<<<<<<<<<< - * - * if r_actual_element[0] != 0: - */ - (__pyx_v_r_actual_element[0]) = __pyx_f_6gensim_6models_7nmf_pgd_fmax((__pyx_v_r_actual_element[0]), 0.0); - - /* "gensim/models/nmf_pgd.pyx":145 - * r_actual_element[0] = fmax(r_actual_element[0], 0) - * - * if r_actual_element[0] != 0: # <<<<<<<<<<<<<< - * r_actual_element[0] = copysign(r_actual_element[0], r_actual_sign) - * r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) - */ - __pyx_t_11 = (((__pyx_v_r_actual_element[0]) != 0.0) != 0); - if (__pyx_t_11) { - - /* "gensim/models/nmf_pgd.pyx":146 - * - * if r_actual_element[0] != 0: - * r_actual_element[0] = copysign(r_actual_element[0], r_actual_sign) # <<<<<<<<<<<<<< - * r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) - * - */ - (__pyx_v_r_actual_element[0]) = copysign((__pyx_v_r_actual_element[0]), __pyx_v_r_actual_sign); - - /* "gensim/models/nmf_pgd.pyx":147 - * if r_actual_element[0] != 0: - * r_actual_element[0] = copysign(r_actual_element[0], r_actual_sign) - * r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) # <<<<<<<<<<<<<< - * - * if r_col_indptr == r_actual_col_indptr: - */ - (__pyx_v_r_actual_element[0]) = __pyx_f_6gensim_6models_7nmf_pgd_clip((__pyx_v_r_actual_element[0]), (-__pyx_v_v_max), __pyx_v_v_max); - - /* "gensim/models/nmf_pgd.pyx":145 - * 
r_actual_element[0] = fmax(r_actual_element[0], 0) - * - * if r_actual_element[0] != 0: # <<<<<<<<<<<<<< - * r_actual_element[0] = copysign(r_actual_element[0], r_actual_sign) - * r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) - */ - } - - /* "gensim/models/nmf_pgd.pyx":149 - * r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) - * - * if r_col_indptr == r_actual_col_indptr: # <<<<<<<<<<<<<< - * violation += (r_element[0] - r_actual_element[0]) ** 2 - * else: - */ - __pyx_t_11 = ((__pyx_v_r_col_indptr == __pyx_v_r_actual_col_indptr) != 0); - if (__pyx_t_11) { - - /* "gensim/models/nmf_pgd.pyx":150 - * - * if r_col_indptr == r_actual_col_indptr: - * violation += (r_element[0] - r_actual_element[0]) ** 2 # <<<<<<<<<<<<<< - * else: - * violation += r_actual_element[0] ** 2 - */ - __pyx_v_violation = (__pyx_v_violation + pow(((__pyx_v_r_element[0]) - (__pyx_v_r_actual_element[0])), 2.0)); - - /* "gensim/models/nmf_pgd.pyx":149 - * r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) - * - * if r_col_indptr == r_actual_col_indptr: # <<<<<<<<<<<<<< - * violation += (r_element[0] - r_actual_element[0]) ** 2 - * else: - */ - goto __pyx_L16; - } - - /* "gensim/models/nmf_pgd.pyx":152 - * violation += (r_element[0] - r_actual_element[0]) ** 2 - * else: - * violation += r_actual_element[0] ** 2 # <<<<<<<<<<<<<< - * - * if r_actual_col_idx < r_actual_col_size: - */ - /*else*/ { - __pyx_v_violation = (__pyx_v_violation + pow((__pyx_v_r_actual_element[0]), 2.0)); - } - __pyx_L16:; - - /* "gensim/models/nmf_pgd.pyx":154 - * violation += r_actual_element[0] ** 2 - * - * if r_actual_col_idx < r_actual_col_size: # <<<<<<<<<<<<<< - * r_actual_col_idx = r_actual_col_idx + 1 - * else: - */ - __pyx_t_11 = ((__pyx_v_r_actual_col_idx < __pyx_v_r_actual_col_size) != 0); - if (__pyx_t_11) { - - /* "gensim/models/nmf_pgd.pyx":155 - * - * if r_actual_col_idx < r_actual_col_size: - * r_actual_col_idx = r_actual_col_idx + 1 # <<<<<<<<<<<<<< - * else: - * 
r_col_idx = r_col_idx + 1 - */ - __pyx_v_r_actual_col_idx = (__pyx_v_r_actual_col_idx + 1); - - /* "gensim/models/nmf_pgd.pyx":154 - * violation += r_actual_element[0] ** 2 - * - * if r_actual_col_idx < r_actual_col_size: # <<<<<<<<<<<<<< - * r_actual_col_idx = r_actual_col_idx + 1 - * else: - */ - goto __pyx_L17; - } - - /* "gensim/models/nmf_pgd.pyx":157 - * r_actual_col_idx = r_actual_col_idx + 1 - * else: - * r_col_idx = r_col_idx + 1 # <<<<<<<<<<<<<< - * else: - * violation += r_element[0] ** 2 - */ - /*else*/ { - __pyx_v_r_col_idx = (__pyx_v_r_col_idx + 1); - } - __pyx_L17:; - - /* "gensim/models/nmf_pgd.pyx":139 - * ] - * - * if r_col_indptr >= r_actual_col_indptr: # <<<<<<<<<<<<<< - * r_actual_sign = copysign(r_actual_sign, r_actual_element[0]) - * - */ - goto __pyx_L14; - } - - /* "gensim/models/nmf_pgd.pyx":159 - * r_col_idx = r_col_idx + 1 - * else: - * violation += r_element[0] ** 2 # <<<<<<<<<<<<<< - * - * if r_col_idx < r_col_size: - */ - /*else*/ { - __pyx_v_violation = (__pyx_v_violation + pow((__pyx_v_r_element[0]), 2.0)); - - /* "gensim/models/nmf_pgd.pyx":161 - * violation += r_element[0] ** 2 - * - * if r_col_idx < r_col_size: # <<<<<<<<<<<<<< - * r_col_idx = r_col_idx + 1 - * else: - */ - __pyx_t_11 = ((__pyx_v_r_col_idx < __pyx_v_r_col_size) != 0); - if (__pyx_t_11) { - - /* "gensim/models/nmf_pgd.pyx":162 - * - * if r_col_idx < r_col_size: - * r_col_idx = r_col_idx + 1 # <<<<<<<<<<<<<< - * else: - * r_actual_col_idx = r_actual_col_idx + 1 - */ - __pyx_v_r_col_idx = (__pyx_v_r_col_idx + 1); - - /* "gensim/models/nmf_pgd.pyx":161 - * violation += r_element[0] ** 2 - * - * if r_col_idx < r_col_size: # <<<<<<<<<<<<<< - * r_col_idx = r_col_idx + 1 - * else: - */ - goto __pyx_L18; - } - - /* "gensim/models/nmf_pgd.pyx":164 - * r_col_idx = r_col_idx + 1 - * else: - * r_actual_col_idx = r_actual_col_idx + 1 # <<<<<<<<<<<<<< - * - * return sqrt(violation) - */ - /*else*/ { - __pyx_v_r_actual_col_idx = (__pyx_v_r_actual_col_idx + 1); - } - __pyx_L18:; 
- } - __pyx_L14:; - } - } - } - } - } - } - #if ((defined(__APPLE__) || defined(__OSX__)) && (defined(__GNUC__) && (__GNUC__ > 2 || (__GNUC__ == 2 && (__GNUC_MINOR__ > 95))))) - #undef likely - #undef unlikely - #define likely(x) __builtin_expect(!!(x), 1) - #define unlikely(x) __builtin_expect(!!(x), 0) - #endif - } - - /* "gensim/models/nmf_pgd.pyx":113 - * cdef double violation = 0 - * - * for sample_idx in prange(n_samples, nogil=True): # <<<<<<<<<<<<<< - * r_col_size = r_indptr[sample_idx + 1] - r_indptr[sample_idx] - * r_actual_col_size = r_actual_indptr[sample_idx + 1] - r_actual_indptr[sample_idx] - */ - /*finally:*/ { - /*normal exit:*/{ - #ifdef WITH_THREAD - __Pyx_FastGIL_Forget(); - Py_BLOCK_THREADS - #endif - goto __pyx_L5; - } - __pyx_L5:; - } - } - - /* "gensim/models/nmf_pgd.pyx":166 - * r_actual_col_idx = r_actual_col_idx + 1 - * - * return sqrt(violation) # <<<<<<<<<<<<<< - */ - __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyFloat_FromDouble(sqrt(__pyx_v_violation)); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 166, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __pyx_r = __pyx_t_1; - __pyx_t_1 = 0; - goto __pyx_L0; - - /* "gensim/models/nmf_pgd.pyx":68 - * return sqrt(violation) - * - * def solve_r( # <<<<<<<<<<<<<< - * r, - * r_actual, - */ - - /* function exit code */ - __pyx_L1_error:; - __Pyx_XDECREF(__pyx_t_1); - __PYX_XDEC_MEMVIEW(&__pyx_t_2, 1); - __PYX_XDEC_MEMVIEW(&__pyx_t_3, 1); - __Pyx_AddTraceback("gensim.models.nmf_pgd.solve_r", __pyx_clineno, __pyx_lineno, __pyx_filename); - __pyx_r = NULL; - __pyx_L0:; - __PYX_XDEC_MEMVIEW(&__pyx_v_r_indptr, 1); - __PYX_XDEC_MEMVIEW(&__pyx_v_r_indices, 1); - __PYX_XDEC_MEMVIEW(&__pyx_v_r_data, 1); - __PYX_XDEC_MEMVIEW(&__pyx_v_r_actual_indptr, 1); - __PYX_XDEC_MEMVIEW(&__pyx_v_r_actual_indices, 1); - __PYX_XDEC_MEMVIEW(&__pyx_v_r_actual_data, 1); + __PYX_XDEC_MEMVIEW(&__pyx_v_permutation, 1); __Pyx_XGIVEREF(__pyx_r); __Pyx_RefNannyFinishContext(); return __pyx_r; @@ -6901,8 +6076,8 @@ static PyObject 
*__pyx_memoryview_is_slice(struct __pyx_memoryview_obj *__pyx_v_ goto __pyx_L9_try_end; __pyx_L4_error:; __Pyx_XDECREF(__pyx_t_6); __pyx_t_6 = 0; - __Pyx_XDECREF(__pyx_t_8); __pyx_t_8 = 0; __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_XDECREF(__pyx_t_8); __pyx_t_8 = 0; /* "View.MemoryView":432 * obj = memoryview(obj, self.flags & ~PyBUF_WRITABLE | PyBUF_ANY_CONTIGUOUS, @@ -7611,11 +6786,11 @@ static PyObject *__pyx_memoryview_convert_item_to_object(struct __pyx_memoryview goto __pyx_L6_except_return; } __pyx_L3_error:; - __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; __Pyx_XDECREF(__pyx_t_6); __pyx_t_6 = 0; + __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; __Pyx_XDECREF(__pyx_t_9); __pyx_t_9 = 0; - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; - __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; /* "View.MemoryView":490 * try: @@ -16849,7 +16024,7 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_ValueError, __pyx_k_ValueError, sizeof(__pyx_k_ValueError), 0, 0, 1, 1}, {&__pyx_n_s_View_MemoryView, __pyx_k_View_MemoryView, sizeof(__pyx_k_View_MemoryView), 0, 0, 1, 1}, {&__pyx_n_s_WtW, __pyx_k_WtW, sizeof(__pyx_k_WtW), 0, 0, 1, 1}, - {&__pyx_n_s_Wt_v_minus_r, __pyx_k_Wt_v_minus_r, sizeof(__pyx_k_Wt_v_minus_r), 0, 0, 1, 1}, + {&__pyx_n_s_Wtv, __pyx_k_Wtv, sizeof(__pyx_k_Wtv), 0, 0, 1, 1}, {&__pyx_n_s_allocate_buffer, __pyx_k_allocate_buffer, sizeof(__pyx_k_allocate_buffer), 0, 0, 1, 1}, {&__pyx_n_s_base, __pyx_k_base, sizeof(__pyx_k_base), 0, 0, 1, 1}, {&__pyx_n_s_c, __pyx_k_c, sizeof(__pyx_k_c), 0, 0, 1, 1}, @@ -16860,7 +16035,6 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_component_idx_2, __pyx_k_component_idx_2, sizeof(__pyx_k_component_idx_2), 0, 0, 1, 1}, {&__pyx_kp_s_contiguous_and_direct, __pyx_k_contiguous_and_direct, sizeof(__pyx_k_contiguous_and_direct), 0, 0, 1, 0}, {&__pyx_kp_s_contiguous_and_indirect, __pyx_k_contiguous_and_indirect, 
sizeof(__pyx_k_contiguous_and_indirect), 0, 0, 1, 0}, - {&__pyx_n_s_data, __pyx_k_data, sizeof(__pyx_k_data), 0, 0, 1, 1}, {&__pyx_n_s_dict, __pyx_k_dict, sizeof(__pyx_k_dict), 0, 0, 1, 1}, {&__pyx_n_s_dtype_is_object, __pyx_k_dtype_is_object, sizeof(__pyx_k_dtype_is_object), 0, 0, 1, 1}, {&__pyx_n_s_encode, __pyx_k_encode, sizeof(__pyx_k_encode), 0, 0, 1, 1}, @@ -16879,12 +16053,9 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_hessian, __pyx_k_hessian, sizeof(__pyx_k_hessian), 0, 0, 1, 1}, {&__pyx_n_s_id, __pyx_k_id, sizeof(__pyx_k_id), 0, 0, 1, 1}, {&__pyx_n_s_import, __pyx_k_import, sizeof(__pyx_k_import), 0, 0, 1, 1}, - {&__pyx_n_s_indices, __pyx_k_indices, sizeof(__pyx_k_indices), 0, 0, 1, 1}, - {&__pyx_n_s_indptr, __pyx_k_indptr, sizeof(__pyx_k_indptr), 0, 0, 1, 1}, {&__pyx_n_s_itemsize, __pyx_k_itemsize, sizeof(__pyx_k_itemsize), 0, 0, 1, 1}, {&__pyx_kp_s_itemsize_0_for_cython_array, __pyx_k_itemsize_0_for_cython_array, sizeof(__pyx_k_itemsize_0_for_cython_array), 0, 0, 1, 0}, {&__pyx_n_s_kappa, __pyx_k_kappa, sizeof(__pyx_k_kappa), 0, 0, 1, 1}, - {&__pyx_n_s_lambda, __pyx_k_lambda, sizeof(__pyx_k_lambda), 0, 0, 1, 1}, {&__pyx_n_s_main, __pyx_k_main, sizeof(__pyx_k_main), 0, 0, 1, 1}, {&__pyx_n_s_memview, __pyx_k_memview, sizeof(__pyx_k_memview), 0, 0, 1, 1}, {&__pyx_n_s_mode, __pyx_k_mode, sizeof(__pyx_k_mode), 0, 0, 1, 1}, @@ -16897,6 +16068,7 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_kp_s_no_default___reduce___due_to_non, __pyx_k_no_default___reduce___due_to_non, sizeof(__pyx_k_no_default___reduce___due_to_non), 0, 0, 1, 0}, {&__pyx_n_s_obj, __pyx_k_obj, sizeof(__pyx_k_obj), 0, 0, 1, 1}, {&__pyx_n_s_pack, __pyx_k_pack, sizeof(__pyx_k_pack), 0, 0, 1, 1}, + {&__pyx_n_s_permutation, __pyx_k_permutation, sizeof(__pyx_k_permutation), 0, 0, 1, 1}, {&__pyx_n_s_pickle, __pyx_k_pickle, sizeof(__pyx_k_pickle), 0, 0, 1, 1}, {&__pyx_n_s_projected_grad, __pyx_k_projected_grad, sizeof(__pyx_k_projected_grad), 0, 0, 1, 1}, 
{&__pyx_n_s_pyx_PickleError, __pyx_k_pyx_PickleError, sizeof(__pyx_k_pyx_PickleError), 0, 0, 1, 1}, @@ -16907,23 +16079,6 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_pyx_type, __pyx_k_pyx_type, sizeof(__pyx_k_pyx_type), 0, 0, 1, 1}, {&__pyx_n_s_pyx_unpickle_Enum, __pyx_k_pyx_unpickle_Enum, sizeof(__pyx_k_pyx_unpickle_Enum), 0, 0, 1, 1}, {&__pyx_n_s_pyx_vtable, __pyx_k_pyx_vtable, sizeof(__pyx_k_pyx_vtable), 0, 0, 1, 1}, - {&__pyx_n_s_r, __pyx_k_r, sizeof(__pyx_k_r), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual, __pyx_k_r_actual, sizeof(__pyx_k_r_actual), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_col_idx, __pyx_k_r_actual_col_idx, sizeof(__pyx_k_r_actual_col_idx), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_col_indptr, __pyx_k_r_actual_col_indptr, sizeof(__pyx_k_r_actual_col_indptr), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_col_size, __pyx_k_r_actual_col_size, sizeof(__pyx_k_r_actual_col_size), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_data, __pyx_k_r_actual_data, sizeof(__pyx_k_r_actual_data), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_element, __pyx_k_r_actual_element, sizeof(__pyx_k_r_actual_element), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_indices, __pyx_k_r_actual_indices, sizeof(__pyx_k_r_actual_indices), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_indptr, __pyx_k_r_actual_indptr, sizeof(__pyx_k_r_actual_indptr), 0, 0, 1, 1}, - {&__pyx_n_s_r_actual_sign, __pyx_k_r_actual_sign, sizeof(__pyx_k_r_actual_sign), 0, 0, 1, 1}, - {&__pyx_n_s_r_col_idx, __pyx_k_r_col_idx, sizeof(__pyx_k_r_col_idx), 0, 0, 1, 1}, - {&__pyx_n_s_r_col_indptr, __pyx_k_r_col_indptr, sizeof(__pyx_k_r_col_indptr), 0, 0, 1, 1}, - {&__pyx_n_s_r_col_size, __pyx_k_r_col_size, sizeof(__pyx_k_r_col_size), 0, 0, 1, 1}, - {&__pyx_n_s_r_data, __pyx_k_r_data, sizeof(__pyx_k_r_data), 0, 0, 1, 1}, - {&__pyx_n_s_r_element, __pyx_k_r_element, sizeof(__pyx_k_r_element), 0, 0, 1, 1}, - {&__pyx_n_s_r_indices, __pyx_k_r_indices, sizeof(__pyx_k_r_indices), 0, 0, 1, 1}, - {&__pyx_n_s_r_indptr, __pyx_k_r_indptr, sizeof(__pyx_k_r_indptr), 0, 0, 
1, 1}, {&__pyx_n_s_range, __pyx_k_range, sizeof(__pyx_k_range), 0, 0, 1, 1}, {&__pyx_n_s_reduce, __pyx_k_reduce, sizeof(__pyx_k_reduce), 0, 0, 1, 1}, {&__pyx_n_s_reduce_cython, __pyx_k_reduce_cython, sizeof(__pyx_k_reduce_cython), 0, 0, 1, 1}, @@ -16934,7 +16089,6 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_shape, __pyx_k_shape, sizeof(__pyx_k_shape), 0, 0, 1, 1}, {&__pyx_n_s_size, __pyx_k_size, sizeof(__pyx_k_size), 0, 0, 1, 1}, {&__pyx_n_s_solve_h, __pyx_k_solve_h, sizeof(__pyx_k_solve_h), 0, 0, 1, 1}, - {&__pyx_n_s_solve_r, __pyx_k_solve_r, sizeof(__pyx_k_solve_r), 0, 0, 1, 1}, {&__pyx_n_s_start, __pyx_k_start, sizeof(__pyx_k_start), 0, 0, 1, 1}, {&__pyx_n_s_step, __pyx_k_step, sizeof(__pyx_k_step), 0, 0, 1, 1}, {&__pyx_n_s_stop, __pyx_k_stop, sizeof(__pyx_k_stop), 0, 0, 1, 1}, @@ -16948,12 +16102,11 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_kp_s_unable_to_allocate_shape_and_str, __pyx_k_unable_to_allocate_shape_and_str, sizeof(__pyx_k_unable_to_allocate_shape_and_str), 0, 0, 1, 0}, {&__pyx_n_s_unpack, __pyx_k_unpack, sizeof(__pyx_k_unpack), 0, 0, 1, 1}, {&__pyx_n_s_update, __pyx_k_update, sizeof(__pyx_k_update), 0, 0, 1, 1}, - {&__pyx_n_s_v_max, __pyx_k_v_max, sizeof(__pyx_k_v_max), 0, 0, 1, 1}, {&__pyx_n_s_violation, __pyx_k_violation, sizeof(__pyx_k_violation), 0, 0, 1, 1}, {0, 0, 0, 0, 0, 0, 0} }; static CYTHON_SMALL_CODE int __Pyx_InitCachedBuiltins(void) { - __pyx_builtin_range = __Pyx_GetBuiltinName(__pyx_n_s_range); if (!__pyx_builtin_range) __PYX_ERR(0, 49, __pyx_L1_error) + __pyx_builtin_range = __Pyx_GetBuiltinName(__pyx_n_s_range); if (!__pyx_builtin_range) __PYX_ERR(0, 44, __pyx_L1_error) __pyx_builtin_ValueError = __Pyx_GetBuiltinName(__pyx_n_s_ValueError); if (!__pyx_builtin_ValueError) __PYX_ERR(1, 133, __pyx_L1_error) __pyx_builtin_MemoryError = __Pyx_GetBuiltinName(__pyx_n_s_MemoryError); if (!__pyx_builtin_MemoryError) __PYX_ERR(1, 148, __pyx_L1_error) __pyx_builtin_enumerate = 
__Pyx_GetBuiltinName(__pyx_n_s_enumerate); if (!__pyx_builtin_enumerate) __PYX_ERR(1, 151, __pyx_L1_error) @@ -17162,29 +16315,17 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__18); __Pyx_GIVEREF(__pyx_tuple__18); - /* "gensim/models/nmf_pgd.pyx":23 - * return a + /* "gensim/models/nmf_pgd.pyx":18 + * return x if x > y else y * - * def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, double kappa): # <<<<<<<<<<<<<< + * def solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa): # <<<<<<<<<<<<<< * """Find optimal dense vector representation for current W and r matrices. * */ - __pyx_tuple__19 = PyTuple_Pack(13, __pyx_n_s_h, __pyx_n_s_Wt_v_minus_r, __pyx_n_s_WtW, __pyx_n_s_kappa, __pyx_n_s_n_components, __pyx_n_s_n_samples, __pyx_n_s_violation, __pyx_n_s_grad, __pyx_n_s_projected_grad, __pyx_n_s_hessian, __pyx_n_s_sample_idx, __pyx_n_s_component_idx_1, __pyx_n_s_component_idx_2); if (unlikely(!__pyx_tuple__19)) __PYX_ERR(0, 23, __pyx_L1_error) + __pyx_tuple__19 = PyTuple_Pack(14, __pyx_n_s_h, __pyx_n_s_Wtv, __pyx_n_s_WtW, __pyx_n_s_permutation, __pyx_n_s_kappa, __pyx_n_s_n_components, __pyx_n_s_n_samples, __pyx_n_s_violation, __pyx_n_s_grad, __pyx_n_s_projected_grad, __pyx_n_s_hessian, __pyx_n_s_sample_idx, __pyx_n_s_component_idx_1, __pyx_n_s_component_idx_2); if (unlikely(!__pyx_tuple__19)) __PYX_ERR(0, 18, __pyx_L1_error) __Pyx_GOTREF(__pyx_tuple__19); __Pyx_GIVEREF(__pyx_tuple__19); - __pyx_codeobj__20 = (PyObject*)__Pyx_PyCode_New(4, 0, 13, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__19, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_nmf_pgd_pyx, __pyx_n_s_solve_h, 23, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__20)) __PYX_ERR(0, 23, __pyx_L1_error) - - /* "gensim/models/nmf_pgd.pyx":68 - * return sqrt(violation) - * - * def solve_r( # <<<<<<<<<<<<<< - * r, - * r_actual, - 
*/ - __pyx_tuple__21 = PyTuple_Pack(22, __pyx_n_s_r, __pyx_n_s_r_actual, __pyx_n_s_lambda, __pyx_n_s_v_max, __pyx_n_s_r_indptr, __pyx_n_s_r_indices, __pyx_n_s_r_data, __pyx_n_s_r_actual_indptr, __pyx_n_s_r_actual_indices, __pyx_n_s_r_actual_data, __pyx_n_s_r_col_size, __pyx_n_s_r_actual_col_size, __pyx_n_s_r_col_indptr, __pyx_n_s_r_actual_col_indptr, __pyx_n_s_r_col_idx, __pyx_n_s_r_actual_col_idx, __pyx_n_s_r_element, __pyx_n_s_r_actual_element, __pyx_n_s_r_actual_sign, __pyx_n_s_n_samples, __pyx_n_s_sample_idx, __pyx_n_s_violation); if (unlikely(!__pyx_tuple__21)) __PYX_ERR(0, 68, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__21); - __Pyx_GIVEREF(__pyx_tuple__21); - __pyx_codeobj__22 = (PyObject*)__Pyx_PyCode_New(4, 0, 22, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__21, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_nmf_pgd_pyx, __pyx_n_s_solve_r, 68, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__22)) __PYX_ERR(0, 68, __pyx_L1_error) + __pyx_codeobj__20 = (PyObject*)__Pyx_PyCode_New(5, 0, 14, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__19, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_nmf_pgd_pyx, __pyx_n_s_solve_h, 18, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__20)) __PYX_ERR(0, 18, __pyx_L1_error) /* "View.MemoryView":286 * return self.name @@ -17193,9 +16334,9 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { * cdef strided = Enum("") # default * cdef indirect = Enum("") */ - __pyx_tuple__23 = PyTuple_Pack(1, __pyx_kp_s_strided_and_direct_or_indirect); if (unlikely(!__pyx_tuple__23)) __PYX_ERR(1, 286, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__23); - __Pyx_GIVEREF(__pyx_tuple__23); + __pyx_tuple__21 = PyTuple_Pack(1, __pyx_kp_s_strided_and_direct_or_indirect); if (unlikely(!__pyx_tuple__21)) __PYX_ERR(1, 286, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__21); + __Pyx_GIVEREF(__pyx_tuple__21); /* 
"View.MemoryView":287 * @@ -17204,9 +16345,9 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { * cdef indirect = Enum("") * */ - __pyx_tuple__24 = PyTuple_Pack(1, __pyx_kp_s_strided_and_direct); if (unlikely(!__pyx_tuple__24)) __PYX_ERR(1, 287, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__24); - __Pyx_GIVEREF(__pyx_tuple__24); + __pyx_tuple__22 = PyTuple_Pack(1, __pyx_kp_s_strided_and_direct); if (unlikely(!__pyx_tuple__22)) __PYX_ERR(1, 287, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__22); + __Pyx_GIVEREF(__pyx_tuple__22); /* "View.MemoryView":288 * cdef generic = Enum("") @@ -17215,9 +16356,9 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { * * */ - __pyx_tuple__25 = PyTuple_Pack(1, __pyx_kp_s_strided_and_indirect); if (unlikely(!__pyx_tuple__25)) __PYX_ERR(1, 288, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__25); - __Pyx_GIVEREF(__pyx_tuple__25); + __pyx_tuple__23 = PyTuple_Pack(1, __pyx_kp_s_strided_and_indirect); if (unlikely(!__pyx_tuple__23)) __PYX_ERR(1, 288, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__23); + __Pyx_GIVEREF(__pyx_tuple__23); /* "View.MemoryView":291 * @@ -17226,9 +16367,9 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { * cdef indirect_contiguous = Enum("") * */ - __pyx_tuple__26 = PyTuple_Pack(1, __pyx_kp_s_contiguous_and_direct); if (unlikely(!__pyx_tuple__26)) __PYX_ERR(1, 291, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__26); - __Pyx_GIVEREF(__pyx_tuple__26); + __pyx_tuple__24 = PyTuple_Pack(1, __pyx_kp_s_contiguous_and_direct); if (unlikely(!__pyx_tuple__24)) __PYX_ERR(1, 291, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__24); + __Pyx_GIVEREF(__pyx_tuple__24); /* "View.MemoryView":292 * @@ -17237,19 +16378,19 @@ static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { * * */ - __pyx_tuple__27 = PyTuple_Pack(1, __pyx_kp_s_contiguous_and_indirect); if (unlikely(!__pyx_tuple__27)) __PYX_ERR(1, 292, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__27); - __Pyx_GIVEREF(__pyx_tuple__27); + 
__pyx_tuple__25 = PyTuple_Pack(1, __pyx_kp_s_contiguous_and_indirect); if (unlikely(!__pyx_tuple__25)) __PYX_ERR(1, 292, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__25); + __Pyx_GIVEREF(__pyx_tuple__25); /* "(tree fragment)":1 * def __pyx_unpickle_Enum(__pyx_type, long __pyx_checksum, __pyx_state): # <<<<<<<<<<<<<< * cdef object __pyx_PickleError * cdef object __pyx_result */ - __pyx_tuple__28 = PyTuple_Pack(5, __pyx_n_s_pyx_type, __pyx_n_s_pyx_checksum, __pyx_n_s_pyx_state, __pyx_n_s_pyx_PickleError, __pyx_n_s_pyx_result); if (unlikely(!__pyx_tuple__28)) __PYX_ERR(1, 1, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__28); - __Pyx_GIVEREF(__pyx_tuple__28); - __pyx_codeobj__29 = (PyObject*)__Pyx_PyCode_New(3, 0, 5, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__28, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_stringsource, __pyx_n_s_pyx_unpickle_Enum, 1, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__29)) __PYX_ERR(1, 1, __pyx_L1_error) + __pyx_tuple__26 = PyTuple_Pack(5, __pyx_n_s_pyx_type, __pyx_n_s_pyx_checksum, __pyx_n_s_pyx_state, __pyx_n_s_pyx_PickleError, __pyx_n_s_pyx_result); if (unlikely(!__pyx_tuple__26)) __PYX_ERR(1, 1, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__26); + __Pyx_GIVEREF(__pyx_tuple__26); + __pyx_codeobj__27 = (PyObject*)__Pyx_PyCode_New(3, 0, 5, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__26, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_stringsource, __pyx_n_s_pyx_unpickle_Enum, 1, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__27)) __PYX_ERR(1, 1, __pyx_L1_error) __Pyx_RefNannyFinishContext(); return 0; __pyx_L1_error:; @@ -17589,28 +16730,16 @@ if (!__Pyx_RefNanny) { if (__Pyx_patch_abc() < 0) __PYX_ERR(0, 1, __pyx_L1_error) #endif - /* "gensim/models/nmf_pgd.pyx":23 - * return a + /* "gensim/models/nmf_pgd.pyx":18 + * return x if x > y else y * - * def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] 
WtW, double kappa): # <<<<<<<<<<<<<< + * def solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa): # <<<<<<<<<<<<<< * """Find optimal dense vector representation for current W and r matrices. * */ - __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_7nmf_pgd_1solve_h, NULL, __pyx_n_s_gensim_models_nmf_pgd); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 23, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_solve_h, __pyx_t_1) < 0) __PYX_ERR(0, 23, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - - /* "gensim/models/nmf_pgd.pyx":68 - * return sqrt(violation) - * - * def solve_r( # <<<<<<<<<<<<<< - * r, - * r_actual, - */ - __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_7nmf_pgd_3solve_r, NULL, __pyx_n_s_gensim_models_nmf_pgd); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 68, __pyx_L1_error) + __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_7nmf_pgd_1solve_h, NULL, __pyx_n_s_gensim_models_nmf_pgd); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 18, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_solve_r, __pyx_t_1) < 0) __PYX_ERR(0, 68, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_solve_h, __pyx_t_1) < 0) __PYX_ERR(0, 18, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; /* "gensim/models/nmf_pgd.pyx":1 @@ -17643,7 +16772,7 @@ if (!__Pyx_RefNanny) { * cdef strided = Enum("") # default * cdef indirect = Enum("") */ - __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__23, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 286, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__21, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 286, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_XGOTREF(generic); __Pyx_DECREF_SET(generic, __pyx_t_1); @@ -17657,7 +16786,7 @@ if (!__Pyx_RefNanny) { * cdef indirect = Enum("") * */ - __pyx_t_1 = 
__Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__24, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 287, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__22, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 287, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_XGOTREF(strided); __Pyx_DECREF_SET(strided, __pyx_t_1); @@ -17671,7 +16800,7 @@ if (!__Pyx_RefNanny) { * * */ - __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__25, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 288, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__23, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 288, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_XGOTREF(indirect); __Pyx_DECREF_SET(indirect, __pyx_t_1); @@ -17685,7 +16814,7 @@ if (!__Pyx_RefNanny) { * cdef indirect_contiguous = Enum("") * */ - __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__26, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 291, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__24, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 291, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_XGOTREF(contiguous); __Pyx_DECREF_SET(contiguous, __pyx_t_1); @@ -17699,7 +16828,7 @@ if (!__Pyx_RefNanny) { * * */ - __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__27, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 292, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_Call(((PyObject *)__pyx_MemviewEnum_type), __pyx_tuple__25, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 292, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_XGOTREF(indirect_contiguous); __Pyx_DECREF_SET(indirect_contiguous, __pyx_t_1); @@ -20755,6 +19884,29 @@ static int __Pyx_ValidateAndInit_memviewslice( return result; } +/* ObjectToMemviewSlice */ + static CYTHON_INLINE __Pyx_memviewslice 
__Pyx_PyObject_to_MemoryviewSlice_dc_int(PyObject *obj, int writable_flag) { + __Pyx_memviewslice result = { 0, 0, { 0 }, { 0 }, { 0 } }; + __Pyx_BufFmt_StackElem stack[1]; + int axes_specs[] = { (__Pyx_MEMVIEW_DIRECT | __Pyx_MEMVIEW_CONTIG) }; + int retcode; + if (obj == Py_None) { + result.memview = (struct __pyx_memoryview_obj *) Py_None; + return result; + } + retcode = __Pyx_ValidateAndInit_memviewslice(axes_specs, __Pyx_IS_C_CONTIG, + (PyBUF_C_CONTIGUOUS | PyBUF_FORMAT) | writable_flag, 1, + &__Pyx_TypeInfo_int, stack, + &result, obj); + if (unlikely(retcode == -1)) + goto __pyx_fail; + return result; +__pyx_fail: + result.memview = NULL; + result.data = NULL; + return result; +} + /* MemviewSliceCopyTemplate */ static __Pyx_memviewslice __pyx_memoryview_copy_new_contig(const __Pyx_memviewslice *from_mvs, @@ -21473,52 +20625,6 @@ __pyx_memoryview_copy_new_contig(const __Pyx_memviewslice *from_mvs, return (char) -1; } -/* ObjectToMemviewSlice */ - static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_dc_int(PyObject *obj, int writable_flag) { - __Pyx_memviewslice result = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_BufFmt_StackElem stack[1]; - int axes_specs[] = { (__Pyx_MEMVIEW_DIRECT | __Pyx_MEMVIEW_CONTIG) }; - int retcode; - if (obj == Py_None) { - result.memview = (struct __pyx_memoryview_obj *) Py_None; - return result; - } - retcode = __Pyx_ValidateAndInit_memviewslice(axes_specs, __Pyx_IS_C_CONTIG, - (PyBUF_C_CONTIGUOUS | PyBUF_FORMAT) | writable_flag, 1, - &__Pyx_TypeInfo_int, stack, - &result, obj); - if (unlikely(retcode == -1)) - goto __pyx_fail; - return result; -__pyx_fail: - result.memview = NULL; - result.data = NULL; - return result; -} - -/* ObjectToMemviewSlice */ - static CYTHON_INLINE __Pyx_memviewslice __Pyx_PyObject_to_MemoryviewSlice_dc_double(PyObject *obj, int writable_flag) { - __Pyx_memviewslice result = { 0, 0, { 0 }, { 0 }, { 0 } }; - __Pyx_BufFmt_StackElem stack[1]; - int axes_specs[] = { (__Pyx_MEMVIEW_DIRECT | 
__Pyx_MEMVIEW_CONTIG) }; - int retcode; - if (obj == Py_None) { - result.memview = (struct __pyx_memoryview_obj *) Py_None; - return result; - } - retcode = __Pyx_ValidateAndInit_memviewslice(axes_specs, __Pyx_IS_C_CONTIG, - (PyBUF_C_CONTIGUOUS | PyBUF_FORMAT) | writable_flag, 1, - &__Pyx_TypeInfo_double, stack, - &result, obj); - if (unlikely(retcode == -1)) - goto __pyx_fail; - return result; -__pyx_fail: - result.memview = NULL; - result.data = NULL; - return result; -} - /* CheckBinaryVersion */ static int __Pyx_check_binary_version(void) { char ctversion[4], rtversion[4]; diff --git a/gensim/models/nmf_pgd.pyx b/gensim/models/nmf_pgd.pyx index 01e9075cbc..dff480cdb4 100644 --- a/gensim/models/nmf_pgd.pyx +++ b/gensim/models/nmf_pgd.pyx @@ -6,7 +6,7 @@ # cython: nonecheck=False # cython: embedsignature=True -from libc.math cimport sqrt, fabs, copysign +from libc.math cimport sqrt from cython.parallel import prange cdef double fmin(double x, double y) nogil: @@ -15,19 +15,14 @@ cdef double fmin(double x, double y) nogil: cdef double fmax(double x, double y) nogil: return x if x > y else y -cdef double clip(double a, double a_min, double a_max) nogil: - a = fmin(a, a_max) - a = fmax(a, a_min) - return a - -def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, double kappa): +def solve_h(double[:, ::1] h, double[:, :] Wtv, double[:, ::1] WtW, int[::1] permutation, double kappa): """Find optimal dense vector representation for current W and r matrices. Parameters ---------- h : matrix Dense representation of documents in current batch. 
- Wt_v_minus_r : matrix + Wtv : matrix WtW : matrix Returns @@ -47,8 +42,9 @@ def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, dou for sample_idx in prange(n_samples, nogil=True): for component_idx_1 in range(n_components): + component_idx_1 = permutation[component_idx_1] - grad = -Wt_v_minus_r[component_idx_1, sample_idx] + grad = -Wtv[component_idx_1, sample_idx] for component_idx_2 in range(n_components): grad += WtW[component_idx_1, component_idx_2] * h[component_idx_2, sample_idx] @@ -64,103 +60,3 @@ def solve_h(double[:, ::1] h, double[:, :] Wt_v_minus_r, double[:, ::1] WtW, dou h[component_idx_1, sample_idx] = fmax(h[component_idx_1, sample_idx] - grad, 0.) return sqrt(violation) - -def solve_r( - r, - r_actual, - double lambda_, - double v_max - ): - """Bound new residuals. - - Parameters - ---------- - r: sparse matrix - r_actual: sparse matrix - lambda_ : double - v_max : double - - Returns - ------- - float - Cumulative difference between previous and current residuals vectors. 
- - """ - - cdef int[::1] r_indptr = r.indptr - cdef int[::1] r_indices = r.indices - cdef double[::1] r_data = r.data - cdef int[::1] r_actual_indptr = r_actual.indptr - cdef int[::1] r_actual_indices = r_actual.indices - cdef double[::1] r_actual_data = r_actual.data - - cdef Py_ssize_t r_col_size = 0 - cdef Py_ssize_t r_actual_col_size = 0 - cdef Py_ssize_t r_col_indptr - cdef Py_ssize_t r_actual_col_indptr - cdef Py_ssize_t r_col_idx - cdef Py_ssize_t r_actual_col_idx - cdef double* r_element - cdef double* r_actual_element - - cdef double r_actual_sign = 1.0 - - cdef Py_ssize_t n_samples = r_actual_indptr.shape[0] - 1 - cdef Py_ssize_t sample_idx - - cdef double violation = 0 - - for sample_idx in prange(n_samples, nogil=True): - r_col_size = r_indptr[sample_idx + 1] - r_indptr[sample_idx] - r_actual_col_size = r_actual_indptr[sample_idx + 1] - r_actual_indptr[sample_idx] - - r_col_idx = 0 - r_actual_col_idx = 0 - - while r_col_idx < r_col_size or r_actual_col_idx < r_actual_col_size: - r_col_indptr = r_indices[ - r_indptr[sample_idx] - + r_col_idx - ] - r_actual_col_indptr = r_actual_indices[ - r_actual_indptr[sample_idx] - + r_actual_col_idx - ] - - r_element = &r_data[ - r_indptr[sample_idx] - + r_col_idx - ] - r_actual_element = &r_actual_data[ - r_actual_indptr[sample_idx] - + r_actual_col_idx - ] - - if r_col_indptr >= r_actual_col_indptr: - r_actual_sign = copysign(r_actual_sign, r_actual_element[0]) - - r_actual_element[0] = fabs(r_actual_element[0]) - lambda_ - r_actual_element[0] = fmax(r_actual_element[0], 0) - - if r_actual_element[0] != 0: - r_actual_element[0] = copysign(r_actual_element[0], r_actual_sign) - r_actual_element[0] = clip(r_actual_element[0], -v_max, v_max) - - if r_col_indptr == r_actual_col_indptr: - violation += (r_element[0] - r_actual_element[0]) ** 2 - else: - violation += r_actual_element[0] ** 2 - - if r_actual_col_idx < r_actual_col_size: - r_actual_col_idx = r_actual_col_idx + 1 - else: - r_col_idx = r_col_idx + 1 - else: - 
violation += r_element[0] ** 2 - - if r_col_idx < r_col_size: - r_col_idx = r_col_idx + 1 - else: - r_actual_col_idx = r_actual_col_idx + 1 - - return sqrt(violation) diff --git a/gensim/models/poincare.py b/gensim/models/poincare.py index 267878302c..0c49c761f2 100644 --- a/gensim/models/poincare.py +++ b/gensim/models/poincare.py @@ -1383,6 +1383,12 @@ def __init__(self, file_path, encoding='utf8', delimiter='\t'): ---------- file_path : str Path to file containing a pair of nodes (a relation) per line, separated by `delimiter`. + Since the relations are asymmetric, the order of `u` and `v` nodes in each pair matters. + To express a "u is v" relation, the lines should take the form `u delimeter v`. + e.g: `kangaroo mammal` is a tab-delimited line expressing a "`kangaroo is a mammal`" relation. + + For a full input file example, see `gensim/test/test_data/poincare_hypernyms.tsv + `_. encoding : str, optional Character encoding of the input file. delimiter : str, optional diff --git a/gensim/models/stdint_wrapper.h b/gensim/models/stdint_wrapper.h new file mode 100644 index 0000000000..0b9832dedf --- /dev/null +++ b/gensim/models/stdint_wrapper.h @@ -0,0 +1,19 @@ +/* + * This file is here to support older versions of the MSVC compiler that don't + * have stdint.h. + */ +#ifdef _MSC_VER + #ifndef _MSC_STDINT_H_ + #if _MSC_VER < 1300 + typedef unsigned char uint8_t; + typedef unsigned int uint32_t; + typedef char int8_t; + #else + typedef unsigned __int8 uint8_t; + typedef unsigned __int32 uint32_t; + typedef char int8_t; + #endif + #endif +#else + #include +#endif diff --git a/gensim/models/utils_any2vec.py b/gensim/models/utils_any2vec.py index 74d0effcff..1d9e03647c 100644 --- a/gensim/models/utils_any2vec.py +++ b/gensim/models/utils_any2vec.py @@ -4,7 +4,26 @@ # Author: Shiva Manne # Copyright (C) 2018 RaRe Technologies s.r.o. -"""General functions used for any2vec models.""" +"""General functions used for any2vec models. 
+ +One of the goals of this module is to provide an abstraction over the Cython +extensions for FastText. If they are not available, then the module substitutes +slower Python versions in their place. + +Another related set of FastText functionality is computing ngrams for a word. +The :py:func:`compute_ngrams` and :py:func:`compute_ngrams_bytes` hashes achieve that. + +Closely related is the functionality for hashing ngrams, implemented by the +:py:func:`ft_hash` and :py:func:`ft_hash_broken` functions. +The module exposes "working" and "broken" hash functions in order to maintain +backwards compatibility with older versions of Gensim. + +For compatibility with older Gensim, use :py:func:`compute_ngrams` and +:py:func:`ft_hash_broken` to has each ngram. For compatibility with the +current Facebook implementation, use :py:func:`compute_ngrams_bytes` and +:py:func:`ft_hash_bytes`. + +""" import logging import numpy as np @@ -18,6 +37,14 @@ logger = logging.getLogger(__name__) +# +# UTF-8 bytes that begin with 10 are subsequent bytes of a multi-byte sequence, +# as opposed to a new character. +# +_MB_MASK = 0xC0 +_MB_START = 0x80 + + def _byte_to_int_py3(b): return b @@ -29,19 +56,23 @@ def _byte_to_int_py2(b): _byte_to_int = _byte_to_int_py2 if PY2 else _byte_to_int_py3 +def _is_utf8_continue(b): + return _byte_to_int(b) & _MB_MASK == _MB_START + + # -# Define this here so we can unittest here. Only use this function if the -# faster C version fails to import. +# Define this here so we can unittest this function directly. +# Only use this function if the faster C version fails to import. # -def _ft_hash_py(string): - """Calculate hash based on `string`. +def _ft_hash_bytes_py(bytez): + """Calculate hash based on `bytez`. Reproduce `hash method from Facebook fastText implementation `_. Parameters ---------- - string : str - The string whose hash needs to be calculated. + bytez : bytes + The string whose hash needs to be calculated, encoded as UTF-8. 
Returns ------- @@ -51,14 +82,14 @@ def _ft_hash_py(string): """ old_settings = np.seterr(all='ignore') h = np.uint32(2166136261) - for c in string.encode('utf-8'): - h = h ^ np.uint32(np.int8(_byte_to_int(c))) + for b in bytez: + h = h ^ np.uint32(np.int8(_byte_to_int(b))) h = h * np.uint32(16777619) np.seterr(**old_settings) return h -def _ft_hash_py_broken(string): +def _ft_hash_broken_py(string): """Calculate hash based on `string`. Reproduce `hash method from Facebook fastText implementation `_. @@ -86,91 +117,178 @@ def _ft_hash_py_broken(string): return h +def _compute_ngrams_py(word, min_n, max_n): + """Get the list of all possible ngrams for a given word. + Parameters + ---------- + word : str + The word whose ngrams need to be computed. + min_n : int + Minimum character length of the ngrams. + max_n : int + Maximum character length of the ngrams. + Returns + ------- + list of str + Sequence of character ngrams. + """ + BOW, EOW = ('<', '>') # Used by FastText to attach to all words as prefix and suffix + extended_word = BOW + word + EOW + ngrams = [] + for ngram_length in range(min_n, min(len(extended_word), max_n) + 1): + for i in range(0, len(extended_word) - ngram_length + 1): + ngrams.append(extended_word[i:i + ngram_length]) + return ngrams + + +def _compute_ngrams_bytes_py(word, min_n, max_n): + """Computes ngrams for a word. + + Ported from the original FB implementation. + + Parameters + ---------- + word : str + A unicode string. + min_n : unsigned int + The minimum ngram length. + max_n : unsigned int + The maximum ngram length. + + Returns: + -------- + list of str + A list of ngrams, where each ngram is a list of **bytes**. 
+ + See Also + -------- + `Original implementation `__ # noqa: E501 + + """ + utf8_word = ('<%s>' % word).encode("utf-8") + num_bytes = len(utf8_word) + n = 0 + + ngrams = [] + for i in range(num_bytes): + if _is_utf8_continue(utf8_word[i]): + continue + + j, n = i, 1 + while j < num_bytes and n <= max_n: + j += 1 + while j < num_bytes and _is_utf8_continue(utf8_word[j]): + j += 1 + if n >= min_n and not (n == 1 and (i == 0 or j == num_bytes)): + ngram = bytes(utf8_word[i:j]) + ngrams.append(ngram) + n += 1 + return ngrams + + +# +# Internally, we use the following convention to abstract away the presence +# or absence of the Cython extensions: +# +# - _function_cy: Imported from Cython extension +# - _function_py: Implemented in Python +# - function: Exported by this module. +# try: from gensim.models._utils_any2vec import ( - ft_hash as _ft_hash_cy, - ft_hash_broken as _ft_hash_cy_broken, - compute_ngrams as _compute_ngrams + compute_ngrams as _compute_ngrams_cy, + compute_ngrams_bytes as _compute_ngrams_bytes_cy, + ft_hash_broken as _ft_hash_broken_cy, + ft_hash_bytes as _ft_hash_bytes_cy, ) - _ft_hash = _ft_hash_cy - _ft_hash_broken = _ft_hash_cy_broken + ft_hash_bytes = _ft_hash_bytes_cy + ft_hash_broken = _ft_hash_broken_cy + compute_ngrams = _compute_ngrams_cy + compute_ngrams_bytes = _compute_ngrams_bytes_cy + FAST_VERSION = 0 except ImportError: + # failed... fall back to plain python FAST_VERSION = -1 + ft_hash_bytes = _ft_hash_bytes_py + ft_hash_broken = _ft_hash_broken_py + compute_ngrams = _compute_ngrams_py + compute_ngrams_bytes = _compute_ngrams_bytes_py - _ft_hash = _ft_hash_py - _ft_hash_broken = _ft_hash_py_broken - # failed... fall back to plain python - def _compute_ngrams(word, min_n, max_n): - """Get the list of all possible ngrams for a given word. - - Parameters - ---------- - word : str - The word whose ngrams need to be computed. - min_n : int - Minimum character length of the ngrams. 
- max_n : int - Maximum character length of the ngrams. - - Returns - ------- - list of str - Sequence of character ngrams. - - """ - BOW, EOW = ('<', '>') # Used by FastText to attach to all words as prefix and suffix - extended_word = BOW + word + EOW - ngrams = [] - for ngram_length in range(min_n, min(len(extended_word), max_n) + 1): - for i in range(0, len(extended_word) - ngram_length + 1): - ngrams.append(extended_word[i:i + ngram_length]) - return ngrams +def ft_ngram_hashes(word, minn, maxn, num_buckets, fb_compatible=True): + """Calculate the ngrams of the word and hash them. + + Parameters + ---------- + word : str + The word to calculate ngram hashes for. + minn : int + Minimum ngram length + maxn : int + Maximum ngram length + num_buckets : int + The number of buckets + fb_compatible : boolean, optional + True for compatibility with the Facebook implementation. + False for compatibility with the old Gensim implementation. + + Returns + ------- + A list of hashes (integers), one per each detected ngram. + + """ + if fb_compatible: + encoded_ngrams = compute_ngrams_bytes(word, minn, maxn) + hashes = [ft_hash_bytes(n) % num_buckets for n in encoded_ngrams] + else: + text_ngrams = compute_ngrams(word, minn, maxn) + hashes = [ft_hash_broken(n) % num_buckets for n in text_ngrams] + return hashes def _save_word2vec_format(fname, vocab, vectors, fvocab=None, binary=False, total_vec=None): - """Store the input-hidden weight matrix in the same format used by the original - C word2vec-tool, for compatibility. - - Parameters - ---------- - fname : str - The file path used to save the vectors in. - vocab : dict - The vocabulary of words. - vectors : numpy.array - The vectors to be stored. - fvocab : str, optional - File path used to save the vocabulary. - binary : bool, optional - If True, the data wil be saved in binary word2vec format, else it will be saved in plain text. 
- total_vec : int, optional - Explicitly specify total number of vectors - (in case word vectors are appended with document vectors afterwards). - - """ - if not (vocab or vectors): - raise RuntimeError("no input") - if total_vec is None: - total_vec = len(vocab) - vector_size = vectors.shape[1] - if fvocab is not None: - logger.info("storing vocabulary in %s", fvocab) - with utils.smart_open(fvocab, 'wb') as vout: - for word, vocab_ in sorted(iteritems(vocab), key=lambda item: -item[1].count): - vout.write(utils.to_utf8("%s %s\n" % (word, vocab_.count))) - logger.info("storing %sx%s projection weights into %s", total_vec, vector_size, fname) - assert (len(vocab), vector_size) == vectors.shape - with utils.smart_open(fname, 'wb') as fout: - fout.write(utils.to_utf8("%s %s\n" % (total_vec, vector_size))) - # store in sorted order: most frequent words at the top + """Store the input-hidden weight matrix in the same format used by the original + C word2vec-tool, for compatibility. + + Parameters + ---------- + fname : str + The file path used to save the vectors in. + vocab : dict + The vocabulary of words. + vectors : numpy.array + The vectors to be stored. + fvocab : str, optional + File path used to save the vocabulary. + binary : bool, optional + If True, the data wil be saved in binary word2vec format, else it will be saved in plain text. + total_vec : int, optional + Explicitly specify total number of vectors + (in case word vectors are appended with document vectors afterwards). 
+ + """ + if not (vocab or vectors): + raise RuntimeError("no input") + if total_vec is None: + total_vec = len(vocab) + vector_size = vectors.shape[1] + if fvocab is not None: + logger.info("storing vocabulary in %s", fvocab) + with utils.smart_open(fvocab, 'wb') as vout: for word, vocab_ in sorted(iteritems(vocab), key=lambda item: -item[1].count): - row = vectors[vocab_.index] - if binary: - row = row.astype(REAL) - fout.write(utils.to_utf8(word) + b" " + row.tostring()) - else: - fout.write(utils.to_utf8("%s %s\n" % (word, ' '.join(repr(val) for val in row)))) + vout.write(utils.to_utf8("%s %s\n" % (word, vocab_.count))) + logger.info("storing %sx%s projection weights into %s", total_vec, vector_size, fname) + assert (len(vocab), vector_size) == vectors.shape + with utils.smart_open(fname, 'wb') as fout: + fout.write(utils.to_utf8("%s %s\n" % (total_vec, vector_size))) + # store in sorted order: most frequent words at the top + for word, vocab_ in sorted(iteritems(vocab), key=lambda item: -item[1].count): + row = vectors[vocab_.index] + if binary: + row = row.astype(REAL) + fout.write(utils.to_utf8(word) + b" " + row.tostring()) + else: + fout.write(utils.to_utf8("%s %s\n" % (word, ' '.join(repr(val) for val in row)))) def _load_word2vec_format(cls, fname, fvocab=None, binary=False, encoding='utf8', unicode_errors='strict', diff --git a/gensim/models/word2vec_corpusfile.cpp b/gensim/models/word2vec_corpusfile.cpp index 7835d19963..aa12258744 100644 --- a/gensim/models/word2vec_corpusfile.cpp +++ b/gensim/models/word2vec_corpusfile.cpp @@ -1,25 +1,4 @@ -/* Generated by Cython 0.28.4 */ - -/* BEGIN: Cython Metadata -{ - "distutils": { - "depends": [ - "gensim/models/fast_line_sentence.h", - "gensim/models/voidptr.h" - ], - "include_dirs": [ - "gensim/models", - "./gensim/models" - ], - "language": "c++", - "name": "gensim.models.word2vec_corpusfile", - "sources": [ - "/home/akhlif/dzr_core/gensim/gensim/models/word2vec_corpusfile.pyx" - ] - }, - "module_name": 
"gensim.models.word2vec_corpusfile" -} -END: Cython Metadata */ +/* Generated by Cython 0.29.2 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -28,7 +7,8 @@ END: Cython Metadata */ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. #else -#define CYTHON_ABI "0_28_4" +#define CYTHON_ABI "0_29_2" +#define CYTHON_HEX_VERSION 0x001D02F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -99,6 +79,10 @@ END: Cython Metadata */ #define CYTHON_PEP489_MULTI_PHASE_INIT 0 #undef CYTHON_USE_TP_FINALIZE #define CYTHON_USE_TP_FINALIZE 0 + #undef CYTHON_USE_DICT_VERSIONS + #define CYTHON_USE_DICT_VERSIONS 0 + #undef CYTHON_USE_EXC_INFO_STACK + #define CYTHON_USE_EXC_INFO_STACK 0 #elif defined(PYSTON_VERSION) #define CYTHON_COMPILING_IN_PYPY 0 #define CYTHON_COMPILING_IN_PYSTON 1 @@ -136,6 +120,10 @@ END: Cython Metadata */ #define CYTHON_PEP489_MULTI_PHASE_INIT 0 #undef CYTHON_USE_TP_FINALIZE #define CYTHON_USE_TP_FINALIZE 0 + #undef CYTHON_USE_DICT_VERSIONS + #define CYTHON_USE_DICT_VERSIONS 0 + #undef CYTHON_USE_EXC_INFO_STACK + #define CYTHON_USE_EXC_INFO_STACK 0 #else #define CYTHON_COMPILING_IN_PYPY 0 #define CYTHON_COMPILING_IN_PYSTON 0 @@ -189,11 +177,17 @@ END: Cython Metadata */ #define CYTHON_FAST_PYCALL 1 #endif #ifndef CYTHON_PEP489_MULTI_PHASE_INIT - #define CYTHON_PEP489_MULTI_PHASE_INIT (0 && PY_VERSION_HEX >= 0x03050000) + #define CYTHON_PEP489_MULTI_PHASE_INIT (PY_VERSION_HEX >= 0x03050000) #endif #ifndef CYTHON_USE_TP_FINALIZE #define CYTHON_USE_TP_FINALIZE (PY_VERSION_HEX >= 0x030400a1) #endif + #ifndef CYTHON_USE_DICT_VERSIONS + #define CYTHON_USE_DICT_VERSIONS (PY_VERSION_HEX >= 0x030600B1) + #endif + #ifndef CYTHON_USE_EXC_INFO_STACK + #define CYTHON_USE_EXC_INFO_STACK (PY_VERSION_HEX >= 0x030700A3) + #endif #endif #if !defined(CYTHON_FAST_PYCCALL) #define CYTHON_FAST_PYCCALL (CYTHON_FAST_PYCALL && PY_VERSION_HEX >= 0x030600B1) @@ -203,6 +197,9 
@@ END: Cython Metadata */ #undef SHIFT #undef BASE #undef MASK + #ifdef SIZEOF_VOID_P + enum { __pyx_check_sizeof_voidp = 1 / (int)(SIZEOF_VOID_P == sizeof(void*)) }; + #endif #endif #ifndef __has_attribute #define __has_attribute(x) 0 @@ -343,6 +340,9 @@ class __Pyx_FakeReference { #ifndef Py_TPFLAGS_HAVE_FINALIZE #define Py_TPFLAGS_HAVE_FINALIZE 0 #endif +#ifndef METH_STACKLESS + #define METH_STACKLESS 0 +#endif #if PY_VERSION_HEX <= 0x030700A3 || !defined(METH_FASTCALL) #ifndef METH_FASTCALL #define METH_FASTCALL 0x80 @@ -356,15 +356,40 @@ class __Pyx_FakeReference { #endif #if CYTHON_FAST_PYCCALL #define __Pyx_PyFastCFunction_Check(func)\ - ((PyCFunction_Check(func) && (METH_FASTCALL == (PyCFunction_GET_FLAGS(func) & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS))))) + ((PyCFunction_Check(func) && (METH_FASTCALL == (PyCFunction_GET_FLAGS(func) & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS | METH_STACKLESS))))) #else #define __Pyx_PyFastCFunction_Check(func) 0 #endif +#if CYTHON_USE_DICT_VERSIONS +#define __PYX_GET_DICT_VERSION(dict) (((PyDictObject*)(dict))->ma_version_tag) +#define __PYX_UPDATE_DICT_CACHE(dict, value, cache_var, version_var)\ + (version_var) = __PYX_GET_DICT_VERSION(dict);\ + (cache_var) = (value); +#define __PYX_PY_DICT_LOOKUP_IF_MODIFIED(VAR, DICT, LOOKUP) {\ + static PY_UINT64_T __pyx_dict_version = 0;\ + static PyObject *__pyx_dict_cached_value = NULL;\ + if (likely(__PYX_GET_DICT_VERSION(DICT) == __pyx_dict_version)) {\ + (VAR) = __pyx_dict_cached_value;\ + } else {\ + (VAR) = __pyx_dict_cached_value = (LOOKUP);\ + __pyx_dict_version = __PYX_GET_DICT_VERSION(DICT);\ + }\ + } +#else +#define __PYX_GET_DICT_VERSION(dict) (0) +#define __PYX_UPDATE_DICT_CACHE(dict, value, cache_var, version_var) +#define __PYX_PY_DICT_LOOKUP_IF_MODIFIED(VAR, DICT, LOOKUP) (VAR) = (LOOKUP); +#endif #if CYTHON_COMPILING_IN_PYPY && !defined(PyObject_Malloc) #define PyObject_Malloc(s) PyMem_Malloc(s) #define PyObject_Free(p) 
PyMem_Free(p) #define PyObject_Realloc(p) PyMem_Realloc(p) #endif +#if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX < 0x030400A1 + #define PyMem_RawMalloc(n) PyMem_Malloc(n) + #define PyMem_RawRealloc(p, n) PyMem_Realloc(p, n) + #define PyMem_RawFree(p) PyMem_Free(p) +#endif #if CYTHON_COMPILING_IN_PYSTON #define __Pyx_PyCode_HasFreeVars(co) PyCode_HasFreeVars(co) #define __Pyx_PyFrame_SetLineNumber(frame, lineno) PyFrame_SetLineNumber(frame, lineno) @@ -472,8 +497,8 @@ static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { #if CYTHON_COMPILING_IN_PYPY && !defined(PyObject_Format) #define PyObject_Format(obj, fmt) PyObject_CallMethod(obj, "__format__", "O", fmt) #endif -#define __Pyx_PyString_FormatSafe(a, b) ((unlikely((a) == Py_None)) ? PyNumber_Remainder(a, b) : __Pyx_PyString_Format(a, b)) -#define __Pyx_PyUnicode_FormatSafe(a, b) ((unlikely((a) == Py_None)) ? PyNumber_Remainder(a, b) : PyUnicode_Format(a, b)) +#define __Pyx_PyString_FormatSafe(a, b) ((unlikely((a) == Py_None || (PyString_Check(b) && !PyString_CheckExact(b)))) ? PyNumber_Remainder(a, b) : __Pyx_PyString_Format(a, b)) +#define __Pyx_PyUnicode_FormatSafe(a, b) ((unlikely((a) == Py_None || (PyUnicode_Check(b) && !PyUnicode_CheckExact(b)))) ? 
PyNumber_Remainder(a, b) : PyUnicode_Format(a, b)) #if PY_MAJOR_VERSION >= 3 #define __Pyx_PyString_Format(a, b) PyUnicode_Format(a, b) #else @@ -639,6 +664,9 @@ typedef struct {PyObject **p; const char *s; const Py_ssize_t n; const char* enc (sizeof(type) == sizeof(Py_ssize_t) &&\ (is_signed || likely(v < (type)PY_SSIZE_T_MAX ||\ v == (type)PY_SSIZE_T_MAX))) ) +static CYTHON_INLINE int __Pyx_is_valid_index(Py_ssize_t i, Py_ssize_t limit) { + return (size_t) i < (size_t) limit; +} #if defined (__cplusplus) && __cplusplus >= 201103L #include #define __Pyx_sst_abs(value) std::abs(value) @@ -697,6 +725,7 @@ static CYTHON_INLINE size_t __Pyx_Py_UNICODE_strlen(const Py_UNICODE *u) { #define __Pyx_Owned_Py_None(b) __Pyx_NewRef(Py_None) static CYTHON_INLINE PyObject * __Pyx_PyBool_FromLong(long b); static CYTHON_INLINE int __Pyx_PyObject_IsTrue(PyObject*); +static CYTHON_INLINE int __Pyx_PyObject_IsTrueAndDecref(PyObject*); static CYTHON_INLINE PyObject* __Pyx_PyNumber_IntOrLong(PyObject* x); #define __Pyx_PySequence_Tuple(obj)\ (likely(PyTuple_CheckExact(obj)) ? __Pyx_NewRef(obj) : PySequence_Tuple(obj)) @@ -777,7 +806,7 @@ static int __Pyx_init_sys_getdefaultencoding_params(void) { if (!default_encoding) goto bad; default_encoding_c = PyBytes_AsString(default_encoding); if (!default_encoding_c) goto bad; - __PYX_DEFAULT_STRING_ENCODING = (char*) malloc(strlen(default_encoding_c)); + __PYX_DEFAULT_STRING_ENCODING = (char*) malloc(strlen(default_encoding_c) + 1); if (!__PYX_DEFAULT_STRING_ENCODING) goto bad; strcpy(__PYX_DEFAULT_STRING_ENCODING, default_encoding_c); Py_DECREF(default_encoding); @@ -855,7 +884,7 @@ static const char *__pyx_f[] = { #define __Pyx_FastGilFuncInit() -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":730 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. 
* * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -864,7 +893,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":731 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -873,7 +902,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":732 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -882,7 +911,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":733 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -891,7 +920,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":737 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 uint8_t # <<<<<<<<<<<<<< @@ -900,7 +929,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":738 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -909,7 +938,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ typedef npy_uint16 
__pyx_t_5numpy_uint16_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":739 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -918,7 +947,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":740 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -927,7 +956,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":744 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -936,7 +965,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":745 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 * * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -945,7 +974,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":754 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -954,7 +983,7 @@ typedef npy_float64 __pyx_t_5numpy_float64_t; */ typedef npy_long 
__pyx_t_5numpy_int_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":755 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -963,7 +992,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":756 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -972,7 +1001,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":758 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -981,7 +1010,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":759 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -990,7 +1019,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":760 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -999,7 +1028,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; 
-/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":762 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -1008,7 +1037,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":763 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -1017,7 +1046,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":765 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -1026,7 +1055,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef npy_double __pyx_t_5numpy_float_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":766 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1035,7 +1064,7 @@ typedef npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":767 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1091,7 +1120,7 @@ struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonLineSentence; struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonVocab; struct 
__pyx_obj_6gensim_6models_19word2vec_corpusfile___pyx_scope_struct____iter__; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":769 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1100,7 +1129,7 @@ struct __pyx_obj_6gensim_6models_19word2vec_corpusfile___pyx_scope_struct____ite */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":770 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1109,7 +1138,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":771 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1118,7 +1147,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":773 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -1450,7 +1479,25 @@ static void __Pyx_RaiseArgtupleInvalid(const char* func_name, int exact, Py_ssize_t num_min, Py_ssize_t num_max, Py_ssize_t num_found); /* GetModuleGlobalName.proto */ -static CYTHON_INLINE PyObject *__Pyx_GetModuleGlobalName(PyObject *name); +#if CYTHON_USE_DICT_VERSIONS +#define __Pyx_GetModuleGlobalName(var, name) {\ + static PY_UINT64_T __pyx_dict_version = 0;\ + static PyObject 
*__pyx_dict_cached_value = NULL;\ + (var) = (likely(__pyx_dict_version == __PYX_GET_DICT_VERSION(__pyx_d))) ?\ + (likely(__pyx_dict_cached_value) ? __Pyx_NewRef(__pyx_dict_cached_value) : __Pyx_GetBuiltinName(name)) :\ + __Pyx__GetModuleGlobalName(name, &__pyx_dict_version, &__pyx_dict_cached_value);\ +} +#define __Pyx_GetModuleGlobalNameUncached(var, name) {\ + PY_UINT64_T __pyx_dict_version;\ + PyObject *__pyx_dict_cached_value;\ + (var) = __Pyx__GetModuleGlobalName(name, &__pyx_dict_version, &__pyx_dict_cached_value);\ +} +static PyObject *__Pyx__GetModuleGlobalName(PyObject *name, PY_UINT64_T *dict_version, PyObject **dict_cached_value); +#else +#define __Pyx_GetModuleGlobalName(var, name) (var) = __Pyx__GetModuleGlobalName(name) +#define __Pyx_GetModuleGlobalNameUncached(var, name) (var) = __Pyx__GetModuleGlobalName(name) +static CYTHON_INLINE PyObject *__Pyx__GetModuleGlobalName(PyObject *name); +#endif /* PyCFunctionFastCall.proto */ #if CYTHON_FAST_PYCCALL @@ -1468,6 +1515,18 @@ static PyObject *__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, #else #define __Pyx_PyFunction_FastCallDict(func, args, nargs, kwargs) _PyFunction_FastCallDict(func, args, nargs, kwargs) #endif +#define __Pyx_BUILD_ASSERT_EXPR(cond)\ + (sizeof(char [1 - 2*!(cond)]) - 1) +#ifndef Py_MEMBER_SIZE +#define Py_MEMBER_SIZE(type, member) sizeof(((type *)0)->member) +#endif + static size_t __pyx_pyframe_localsplus_offset = 0; + #include "frameobject.h" + #define __Pxy_PyFrame_Initialize_Offsets()\ + ((void)__Pyx_BUILD_ASSERT_EXPR(sizeof(PyFrameObject) == offsetof(PyFrameObject, f_localsplus) + Py_MEMBER_SIZE(PyFrameObject, f_localsplus)),\ + (void)(__pyx_pyframe_localsplus_offset = ((size_t)PyFrame_Type.tp_basicsize) - Py_MEMBER_SIZE(PyFrameObject, f_localsplus))) + #define __Pyx_PyFrame_GetLocalsplus(frame)\ + (assert(__pyx_pyframe_localsplus_offset), (PyObject **)(((char *)(frame)) + __pyx_pyframe_localsplus_offset)) #endif /* PyObjectCall.proto */ @@ -1477,6 +1536,9 @@ 
static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg #define __Pyx_PyObject_Call(func, arg, kw) PyObject_Call(func, arg, kw) #endif +/* PyObjectCall2Args.proto */ +static CYTHON_UNUSED PyObject* __Pyx_PyObject_Call2Args(PyObject* function, PyObject* arg1, PyObject* arg2); + /* PyObjectCallMethO.proto */ #if CYTHON_COMPILING_IN_CPYTHON static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject *arg); @@ -1589,6 +1651,11 @@ static PyObject *__Pyx_PyDict_GetItem(PyObject *d, PyObject* key); /* RaiseNoneIterError.proto */ static CYTHON_INLINE void __Pyx_RaiseNoneNotIterableError(void); +/* GetTopmostException.proto */ +#if CYTHON_USE_EXC_INFO_STACK +static _PyErr_StackItem * __Pyx_PyErr_GetTopmostException(PyThreadState *tstate); +#endif + /* SaveResetException.proto */ #if CYTHON_FAST_THREAD_STATE #define __Pyx_ExceptionSave(type, value, tb) __Pyx__ExceptionSave(__pyx_tstate, type, value, tb) @@ -1649,6 +1716,17 @@ static int __Pyx_SetVtable(PyObject *dict, void *vtable); /* SetupReduce.proto */ static int __Pyx_setup_reduce(PyObject* type_obj); +/* TypeImport.proto */ +#ifndef __PYX_HAVE_RT_ImportType_proto +#define __PYX_HAVE_RT_ImportType_proto +enum __Pyx_ImportType_CheckSize { + __Pyx_ImportType_CheckSize_Error = 0, + __Pyx_ImportType_CheckSize_Warn = 1, + __Pyx_ImportType_CheckSize_Ignore = 2 +}; +static PyTypeObject *__Pyx_ImportType(PyObject* module, const char *module_name, const char *class_name, size_t size, enum __Pyx_ImportType_CheckSize check_size); +#endif + /* Import.proto */ static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level); @@ -1881,19 +1959,28 @@ static CYTHON_INLINE void __Pyx__ExceptionSwap(PyThreadState *tstate, PyObject * static CYTHON_INLINE void __Pyx_ExceptionSwap(PyObject **type, PyObject **value, PyObject **tb); #endif +/* PyObjectGetMethod.proto */ +static int __Pyx_PyObject_GetMethod(PyObject *obj, PyObject *name, PyObject **method); + /* 
PyObjectCallMethod1.proto */ static PyObject* __Pyx_PyObject_CallMethod1(PyObject* obj, PyObject* method_name, PyObject* arg); -static PyObject* __Pyx__PyObject_CallMethod1(PyObject* method, PyObject* arg); /* CoroutineBase.proto */ typedef PyObject *(*__pyx_coroutine_body_t)(PyObject *, PyThreadState *, PyObject *); +#if CYTHON_USE_EXC_INFO_STACK +#define __Pyx_ExcInfoStruct _PyErr_StackItem +#else typedef struct { - PyObject_HEAD - __pyx_coroutine_body_t body; - PyObject *closure; PyObject *exc_type; PyObject *exc_value; PyObject *exc_traceback; +} __Pyx_ExcInfoStruct; +#endif +typedef struct { + PyObject_HEAD + __pyx_coroutine_body_t body; + PyObject *closure; + __Pyx_ExcInfoStruct gi_exc_state; PyObject *gi_weakreflist; PyObject *classobj; PyObject *yieldfrom; @@ -1910,18 +1997,24 @@ static __pyx_CoroutineObject *__Pyx__Coroutine_New( static __pyx_CoroutineObject *__Pyx__Coroutine_NewInit( __pyx_CoroutineObject *gen, __pyx_coroutine_body_t body, PyObject *code, PyObject *closure, PyObject *name, PyObject *qualname, PyObject *module_name); +static CYTHON_INLINE void __Pyx_Coroutine_ExceptionClear(__Pyx_ExcInfoStruct *self); static int __Pyx_Coroutine_clear(PyObject *self); static PyObject *__Pyx_Coroutine_Send(PyObject *self, PyObject *value); static PyObject *__Pyx_Coroutine_Close(PyObject *self); static PyObject *__Pyx_Coroutine_Throw(PyObject *gen, PyObject *args); +#if CYTHON_USE_EXC_INFO_STACK +#define __Pyx_Coroutine_SwapException(self) +#define __Pyx_Coroutine_ResetAndClearException(self) __Pyx_Coroutine_ExceptionClear(&(self)->gi_exc_state) +#else #define __Pyx_Coroutine_SwapException(self) {\ - __Pyx_ExceptionSwap(&(self)->exc_type, &(self)->exc_value, &(self)->exc_traceback);\ - __Pyx_Coroutine_ResetFrameBackpointer(self);\ + __Pyx_ExceptionSwap(&(self)->gi_exc_state.exc_type, &(self)->gi_exc_state.exc_value, &(self)->gi_exc_state.exc_traceback);\ + __Pyx_Coroutine_ResetFrameBackpointer(&(self)->gi_exc_state);\ } #define 
__Pyx_Coroutine_ResetAndClearException(self) {\ - __Pyx_ExceptionReset((self)->exc_type, (self)->exc_value, (self)->exc_traceback);\ - (self)->exc_type = (self)->exc_value = (self)->exc_traceback = NULL;\ + __Pyx_ExceptionReset((self)->gi_exc_state.exc_type, (self)->gi_exc_state.exc_value, (self)->gi_exc_state.exc_traceback);\ + (self)->gi_exc_state.exc_type = (self)->gi_exc_state.exc_value = (self)->gi_exc_state.exc_traceback = NULL;\ } +#endif #if CYTHON_FAST_THREAD_STATE #define __Pyx_PyGen_FetchStopIterationValue(pvalue)\ __Pyx_PyGen__FetchStopIterationValue(__pyx_tstate, pvalue) @@ -1930,7 +2023,7 @@ static PyObject *__Pyx_Coroutine_Throw(PyObject *gen, PyObject *args); __Pyx_PyGen__FetchStopIterationValue(__Pyx_PyThreadState_Current, pvalue) #endif static int __Pyx_PyGen__FetchStopIterationValue(PyThreadState *tstate, PyObject **pvalue); -static CYTHON_INLINE void __Pyx_Coroutine_ResetFrameBackpointer(__pyx_CoroutineObject *self); +static CYTHON_INLINE void __Pyx_Coroutine_ResetFrameBackpointer(__Pyx_ExcInfoStruct *exc_state); /* PatchModuleWithCoroutine.proto */ static PyObject* __Pyx_Coroutine_patch_module(PyObject* module, const char* py_code); @@ -1953,21 +2046,6 @@ static int __Pyx_check_binary_version(void); /* FunctionExport.proto */ static int __Pyx_ExportFunction(const char *name, void (*f)(void), const char *sig); -/* PyIdentifierFromString.proto */ -#if !defined(__Pyx_PyIdentifier_FromString) -#if PY_MAJOR_VERSION < 3 - #define __Pyx_PyIdentifier_FromString(s) PyString_FromString(s) -#else - #define __Pyx_PyIdentifier_FromString(s) PyUnicode_FromString(s) -#endif -#endif - -/* ModuleImport.proto */ -static PyObject *__Pyx_ImportModule(const char *name); - -/* TypeImport.proto */ -static PyTypeObject *__Pyx_ImportType(const char *module_name, const char *class_name, size_t size, int strict); - /* VoidPtrImport.proto */ static int __Pyx_ImportVoidPtr(PyObject *module, const char *name, void **p, const char *sig); @@ -2131,6 +2209,7 @@ static const 
char __pyx_k_ValueError[] = "ValueError"; static const char __pyx_k_num_epochs[] = "num_epochs"; static const char __pyx_k_pyx_vtable[] = "__pyx_vtable__"; static const char __pyx_k_sample_int[] = "sample_int"; +static const char __pyx_k_CythonVocab[] = "CythonVocab"; static const char __pyx_k_ImportError[] = "ImportError"; static const char __pyx_k_corpus_file[] = "corpus_file"; static const char __pyx_k_cur_epoch_2[] = "cur_epoch"; @@ -2153,6 +2232,7 @@ static const char __pyx_k_train_epoch_cbow[] = "train_epoch_cbow"; static const char __pyx_k_effective_samples[] = "effective_samples"; static const char __pyx_k_expected_examples[] = "_expected_examples"; static const char __pyx_k_CORPUSFILE_VERSION[] = "CORPUSFILE_VERSION"; +static const char __pyx_k_CythonLineSentence[] = "CythonLineSentence"; static const char __pyx_k_cline_in_traceback[] = "cline_in_traceback"; static const char __pyx_k_effective_sentences[] = "effective_sentences"; static const char __pyx_k_expected_examples_2[] = "expected_examples"; @@ -2174,7 +2254,9 @@ static const char __pyx_k_self_vocab_cannot_be_converted_t[] = "self.vocab canno static const char __pyx_k_Format_string_allocated_too_shor_2[] = "Format string allocated too short."; static const char __pyx_k_gensim_models_word2vec_corpusfil_2[] = "gensim/models/word2vec_corpusfile.pyx"; static PyObject *__pyx_n_s_CORPUSFILE_VERSION; +static PyObject *__pyx_n_s_CythonLineSentence; static PyObject *__pyx_n_s_CythonLineSentence___iter; +static PyObject *__pyx_n_s_CythonVocab; static PyObject *__pyx_kp_u_Format_string_allocated_too_shor; static PyObject *__pyx_kp_u_Format_string_allocated_too_shor_2; static PyObject *__pyx_n_s_ImportError; @@ -2310,14 +2392,11 @@ static PyObject *__pyx_tuple__7; static PyObject *__pyx_tuple__8; static PyObject *__pyx_tuple__9; static PyObject *__pyx_tuple__10; -static PyObject *__pyx_tuple__11; static PyObject *__pyx_tuple__12; -static PyObject *__pyx_tuple__13; -static PyObject *__pyx_tuple__15; -static 
PyObject *__pyx_tuple__17; -static PyObject *__pyx_codeobj__14; -static PyObject *__pyx_codeobj__16; -static PyObject *__pyx_codeobj__18; +static PyObject *__pyx_tuple__14; +static PyObject *__pyx_codeobj__11; +static PyObject *__pyx_codeobj__13; +static PyObject *__pyx_codeobj__15; /* Late includes */ /* "gensim/models/word2vec_corpusfile.pyx":41 @@ -2417,9 +2496,9 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ PyObject *__pyx_t_2 = NULL; PyObject *__pyx_t_3 = NULL; PyObject *__pyx_t_4 = NULL; - PyObject *__pyx_t_5 = NULL; - Py_ssize_t __pyx_t_6; - PyObject *(*__pyx_t_7)(PyObject *); + Py_ssize_t __pyx_t_5; + PyObject *(*__pyx_t_6)(PyObject *); + PyObject *__pyx_t_7 = NULL; PyObject *(*__pyx_t_8)(PyObject *); __pyx_t_5numpy_uint32_t __pyx_t_9; PY_LONG_LONG __pyx_t_10; @@ -2435,7 +2514,7 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ * token = any2utf8(py_token) * word.index = vocab_item.index */ - __pyx_t_2 = __Pyx_GetModuleGlobalName(__pyx_n_s_iteritems); if (unlikely(!__pyx_t_2)) __PYX_ERR(1, 44, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_2, __pyx_n_s_iteritems); if (unlikely(!__pyx_t_2)) __PYX_ERR(1, 44, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_wv, __pyx_n_s_vocab); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 44, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); @@ -2449,72 +2528,42 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ __Pyx_DECREF_SET(__pyx_t_2, function); } } - if (!__pyx_t_4) { - __pyx_t_1 = __Pyx_PyObject_CallOneArg(__pyx_t_2, __pyx_t_3); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __Pyx_GOTREF(__pyx_t_1); - } else { - #if CYTHON_FAST_PYCALL - if (PyFunction_Check(__pyx_t_2)) { - PyObject *__pyx_temp[2] = {__pyx_t_4, __pyx_t_3}; - __pyx_t_1 = __Pyx_PyFunction_FastCall(__pyx_t_2, __pyx_temp+1-1, 1+1); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 
44, __pyx_L1_error) - __Pyx_XDECREF(__pyx_t_4); __pyx_t_4 = 0; - __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - } else - #endif - #if CYTHON_FAST_PYCCALL - if (__Pyx_PyFastCFunction_Check(__pyx_t_2)) { - PyObject *__pyx_temp[2] = {__pyx_t_4, __pyx_t_3}; - __pyx_t_1 = __Pyx_PyCFunction_FastCall(__pyx_t_2, __pyx_temp+1-1, 1+1); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) - __Pyx_XDECREF(__pyx_t_4); __pyx_t_4 = 0; - __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - } else - #endif - { - __pyx_t_5 = PyTuple_New(1+1); if (unlikely(!__pyx_t_5)) __PYX_ERR(1, 44, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_5); - __Pyx_GIVEREF(__pyx_t_4); PyTuple_SET_ITEM(__pyx_t_5, 0, __pyx_t_4); __pyx_t_4 = NULL; - __Pyx_GIVEREF(__pyx_t_3); - PyTuple_SET_ITEM(__pyx_t_5, 0+1, __pyx_t_3); - __pyx_t_3 = 0; - __pyx_t_1 = __Pyx_PyObject_Call(__pyx_t_2, __pyx_t_5, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_5); __pyx_t_5 = 0; - } - } + __pyx_t_1 = (__pyx_t_4) ? 
__Pyx_PyObject_Call2Args(__pyx_t_2, __pyx_t_4, __pyx_t_3) : __Pyx_PyObject_CallOneArg(__pyx_t_2, __pyx_t_3); + __Pyx_XDECREF(__pyx_t_4); __pyx_t_4 = 0; + __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; + if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; if (likely(PyList_CheckExact(__pyx_t_1)) || PyTuple_CheckExact(__pyx_t_1)) { - __pyx_t_2 = __pyx_t_1; __Pyx_INCREF(__pyx_t_2); __pyx_t_6 = 0; - __pyx_t_7 = NULL; + __pyx_t_2 = __pyx_t_1; __Pyx_INCREF(__pyx_t_2); __pyx_t_5 = 0; + __pyx_t_6 = NULL; } else { - __pyx_t_6 = -1; __pyx_t_2 = PyObject_GetIter(__pyx_t_1); if (unlikely(!__pyx_t_2)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_5 = -1; __pyx_t_2 = PyObject_GetIter(__pyx_t_1); if (unlikely(!__pyx_t_2)) __PYX_ERR(1, 44, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_7 = Py_TYPE(__pyx_t_2)->tp_iternext; if (unlikely(!__pyx_t_7)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_6 = Py_TYPE(__pyx_t_2)->tp_iternext; if (unlikely(!__pyx_t_6)) __PYX_ERR(1, 44, __pyx_L1_error) } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; for (;;) { - if (likely(!__pyx_t_7)) { + if (likely(!__pyx_t_6)) { if (likely(PyList_CheckExact(__pyx_t_2))) { - if (__pyx_t_6 >= PyList_GET_SIZE(__pyx_t_2)) break; + if (__pyx_t_5 >= PyList_GET_SIZE(__pyx_t_2)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_1 = PyList_GET_ITEM(__pyx_t_2, __pyx_t_6); __Pyx_INCREF(__pyx_t_1); __pyx_t_6++; if (unlikely(0 < 0)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_1 = PyList_GET_ITEM(__pyx_t_2, __pyx_t_5); __Pyx_INCREF(__pyx_t_1); __pyx_t_5++; if (unlikely(0 < 0)) __PYX_ERR(1, 44, __pyx_L1_error) #else - __pyx_t_1 = PySequence_ITEM(__pyx_t_2, __pyx_t_6); __pyx_t_6++; if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_1 = PySequence_ITEM(__pyx_t_2, __pyx_t_5); __pyx_t_5++; if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); #endif } else { - if (__pyx_t_6 >= 
PyTuple_GET_SIZE(__pyx_t_2)) break; + if (__pyx_t_5 >= PyTuple_GET_SIZE(__pyx_t_2)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_1 = PyTuple_GET_ITEM(__pyx_t_2, __pyx_t_6); __Pyx_INCREF(__pyx_t_1); __pyx_t_6++; if (unlikely(0 < 0)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_1 = PyTuple_GET_ITEM(__pyx_t_2, __pyx_t_5); __Pyx_INCREF(__pyx_t_1); __pyx_t_5++; if (unlikely(0 < 0)) __PYX_ERR(1, 44, __pyx_L1_error) #else - __pyx_t_1 = PySequence_ITEM(__pyx_t_2, __pyx_t_6); __pyx_t_6++; if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_1 = PySequence_ITEM(__pyx_t_2, __pyx_t_5); __pyx_t_5++; if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 44, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); #endif } } else { - __pyx_t_1 = __pyx_t_7(__pyx_t_2); + __pyx_t_1 = __pyx_t_6(__pyx_t_2); if (unlikely(!__pyx_t_1)) { PyObject* exc_type = PyErr_Occurred(); if (exc_type) { @@ -2535,46 +2584,46 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ } #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS if (likely(PyTuple_CheckExact(sequence))) { - __pyx_t_5 = PyTuple_GET_ITEM(sequence, 0); - __pyx_t_3 = PyTuple_GET_ITEM(sequence, 1); + __pyx_t_3 = PyTuple_GET_ITEM(sequence, 0); + __pyx_t_4 = PyTuple_GET_ITEM(sequence, 1); } else { - __pyx_t_5 = PyList_GET_ITEM(sequence, 0); - __pyx_t_3 = PyList_GET_ITEM(sequence, 1); + __pyx_t_3 = PyList_GET_ITEM(sequence, 0); + __pyx_t_4 = PyList_GET_ITEM(sequence, 1); } - __Pyx_INCREF(__pyx_t_5); __Pyx_INCREF(__pyx_t_3); + __Pyx_INCREF(__pyx_t_4); #else - __pyx_t_5 = PySequence_ITEM(sequence, 0); if (unlikely(!__pyx_t_5)) __PYX_ERR(1, 44, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_5); - __pyx_t_3 = PySequence_ITEM(sequence, 1); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 44, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(sequence, 0); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 44, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); + __pyx_t_4 = PySequence_ITEM(sequence, 1); if (unlikely(!__pyx_t_4)) 
__PYX_ERR(1, 44, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_4); #endif __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; } else { Py_ssize_t index = -1; - __pyx_t_4 = PyObject_GetIter(__pyx_t_1); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 44, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_4); + __pyx_t_7 = PyObject_GetIter(__pyx_t_1); if (unlikely(!__pyx_t_7)) __PYX_ERR(1, 44, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_7); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_t_8 = Py_TYPE(__pyx_t_4)->tp_iternext; - index = 0; __pyx_t_5 = __pyx_t_8(__pyx_t_4); if (unlikely(!__pyx_t_5)) goto __pyx_L5_unpacking_failed; - __Pyx_GOTREF(__pyx_t_5); - index = 1; __pyx_t_3 = __pyx_t_8(__pyx_t_4); if (unlikely(!__pyx_t_3)) goto __pyx_L5_unpacking_failed; + __pyx_t_8 = Py_TYPE(__pyx_t_7)->tp_iternext; + index = 0; __pyx_t_3 = __pyx_t_8(__pyx_t_7); if (unlikely(!__pyx_t_3)) goto __pyx_L5_unpacking_failed; __Pyx_GOTREF(__pyx_t_3); - if (__Pyx_IternextUnpackEndCheck(__pyx_t_8(__pyx_t_4), 2) < 0) __PYX_ERR(1, 44, __pyx_L1_error) + index = 1; __pyx_t_4 = __pyx_t_8(__pyx_t_7); if (unlikely(!__pyx_t_4)) goto __pyx_L5_unpacking_failed; + __Pyx_GOTREF(__pyx_t_4); + if (__Pyx_IternextUnpackEndCheck(__pyx_t_8(__pyx_t_7), 2) < 0) __PYX_ERR(1, 44, __pyx_L1_error) __pyx_t_8 = NULL; - __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; + __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; goto __pyx_L6_unpacking_done; __pyx_L5_unpacking_failed:; - __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; + __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; __pyx_t_8 = NULL; if (__Pyx_IterFinish() == 0) __Pyx_RaiseNeedMoreValuesError(index); __PYX_ERR(1, 44, __pyx_L1_error) __pyx_L6_unpacking_done:; } - __Pyx_XDECREF_SET(__pyx_v_py_token, __pyx_t_5); - __pyx_t_5 = 0; - __Pyx_XDECREF_SET(__pyx_v_vocab_item, __pyx_t_3); + __Pyx_XDECREF_SET(__pyx_v_py_token, __pyx_t_3); __pyx_t_3 = 0; + __Pyx_XDECREF_SET(__pyx_v_vocab_item, __pyx_t_4); + __pyx_t_4 = 0; /* "gensim/models/word2vec_corpusfile.pyx":45 * @@ -2583,51 +2632,23 @@ static int 
__pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ * word.index = vocab_item.index * word.sample_int = vocab_item.sample_int */ - __pyx_t_3 = __Pyx_GetModuleGlobalName(__pyx_n_s_any2utf8); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 45, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_3); - __pyx_t_5 = NULL; - if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_3))) { - __pyx_t_5 = PyMethod_GET_SELF(__pyx_t_3); - if (likely(__pyx_t_5)) { - PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_3); - __Pyx_INCREF(__pyx_t_5); + __Pyx_GetModuleGlobalName(__pyx_t_4, __pyx_n_s_any2utf8); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 45, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_4); + __pyx_t_3 = NULL; + if (CYTHON_UNPACK_METHODS && unlikely(PyMethod_Check(__pyx_t_4))) { + __pyx_t_3 = PyMethod_GET_SELF(__pyx_t_4); + if (likely(__pyx_t_3)) { + PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_4); + __Pyx_INCREF(__pyx_t_3); __Pyx_INCREF(function); - __Pyx_DECREF_SET(__pyx_t_3, function); - } - } - if (!__pyx_t_5) { - __pyx_t_1 = __Pyx_PyObject_CallOneArg(__pyx_t_3, __pyx_v_py_token); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 45, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - } else { - #if CYTHON_FAST_PYCALL - if (PyFunction_Check(__pyx_t_3)) { - PyObject *__pyx_temp[2] = {__pyx_t_5, __pyx_v_py_token}; - __pyx_t_1 = __Pyx_PyFunction_FastCall(__pyx_t_3, __pyx_temp+1-1, 1+1); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 45, __pyx_L1_error) - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; - __Pyx_GOTREF(__pyx_t_1); - } else - #endif - #if CYTHON_FAST_PYCCALL - if (__Pyx_PyFastCFunction_Check(__pyx_t_3)) { - PyObject *__pyx_temp[2] = {__pyx_t_5, __pyx_v_py_token}; - __pyx_t_1 = __Pyx_PyCFunction_FastCall(__pyx_t_3, __pyx_temp+1-1, 1+1); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 45, __pyx_L1_error) - __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; - __Pyx_GOTREF(__pyx_t_1); - } else - #endif - { - __pyx_t_4 = PyTuple_New(1+1); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 45, __pyx_L1_error) - 
__Pyx_GOTREF(__pyx_t_4); - __Pyx_GIVEREF(__pyx_t_5); PyTuple_SET_ITEM(__pyx_t_4, 0, __pyx_t_5); __pyx_t_5 = NULL; - __Pyx_INCREF(__pyx_v_py_token); - __Pyx_GIVEREF(__pyx_v_py_token); - PyTuple_SET_ITEM(__pyx_t_4, 0+1, __pyx_v_py_token); - __pyx_t_1 = __Pyx_PyObject_Call(__pyx_t_3, __pyx_t_4, NULL); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 45, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; + __Pyx_DECREF_SET(__pyx_t_4, function); } } - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; + __pyx_t_1 = (__pyx_t_3) ? __Pyx_PyObject_Call2Args(__pyx_t_4, __pyx_t_3, __pyx_v_py_token) : __Pyx_PyObject_CallOneArg(__pyx_t_4, __pyx_v_py_token); + __Pyx_XDECREF(__pyx_t_3); __pyx_t_3 = 0; + if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 45, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __Pyx_XDECREF_SET(__pyx_v_token, __pyx_t_1); __pyx_t_1 = 0; @@ -2734,11 +2755,11 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ */ __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_wv, __pyx_n_s_buckets_word); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 56, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_GetItemInt(__pyx_t_1, __pyx_v_word.index, __pyx_t_5numpy_uint32_t, 0, __Pyx_PyInt_From_npy_uint32, 0, 0, 0); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 56, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_3); + __pyx_t_4 = __Pyx_GetItemInt(__pyx_t_1, __pyx_v_word.index, __pyx_t_5numpy_uint32_t, 0, __Pyx_PyInt_From_npy_uint32, 0, 0, 0); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 56, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_4); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_t_12 = PyObject_Length(__pyx_t_3); if (unlikely(__pyx_t_12 == ((Py_ssize_t)-1))) __PYX_ERR(1, 56, __pyx_L1_error) - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; + __pyx_t_12 = PyObject_Length(__pyx_t_4); if (unlikely(__pyx_t_12 == ((Py_ssize_t)-1))) __PYX_ERR(1, 56, __pyx_L1_error) + __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; __pyx_v_word.subword_idx_len = 
((int)__pyx_t_12); /* "gensim/models/word2vec_corpusfile.pyx":57 @@ -2748,11 +2769,11 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ * * self.vocab[token] = word */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_wv, __pyx_n_s_buckets_word); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 57, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_3); - __pyx_t_1 = __Pyx_GetItemInt(__pyx_t_3, __pyx_v_word.index, __pyx_t_5numpy_uint32_t, 0, __Pyx_PyInt_From_npy_uint32, 0, 0, 0); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 57, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyObject_GetAttrStr(__pyx_v_wv, __pyx_n_s_buckets_word); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 57, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_4); + __pyx_t_1 = __Pyx_GetItemInt(__pyx_t_4, __pyx_v_word.index, __pyx_t_5numpy_uint32_t, 0, __Pyx_PyInt_From_npy_uint32, 0, 0, 0); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 57, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; + __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!(likely(((__pyx_t_1) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_1, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(1, 57, __pyx_L1_error) __pyx_v_word.subword_idx = ((__pyx_t_5numpy_uint32_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_1))); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; @@ -2802,7 +2823,7 @@ static int __pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab___init__ __Pyx_XDECREF(__pyx_t_2); __Pyx_XDECREF(__pyx_t_3); __Pyx_XDECREF(__pyx_t_4); - __Pyx_XDECREF(__pyx_t_5); + __Pyx_XDECREF(__pyx_t_7); __Pyx_AddTraceback("gensim.models.word2vec_corpusfile.CythonVocab.__init__", __pyx_clineno, __pyx_lineno, __pyx_filename); __pyx_r = -1; __pyx_L0:; @@ -2967,7 +2988,7 @@ static PyObject *__pyx_pf_6gensim_6models_19word2vec_corpusfile_11CythonVocab_4_ /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_19word2vec_corpusfile_1rebuild_cython_line_sentence(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char 
__pyx_doc_6gensim_6models_19word2vec_corpusfile_rebuild_cython_line_sentence[] = "rebuild_cython_line_sentence(source, max_sentence_length)"; -static PyMethodDef __pyx_mdef_6gensim_6models_19word2vec_corpusfile_1rebuild_cython_line_sentence = {"rebuild_cython_line_sentence", (PyCFunction)__pyx_pw_6gensim_6models_19word2vec_corpusfile_1rebuild_cython_line_sentence, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_19word2vec_corpusfile_rebuild_cython_line_sentence}; +static PyMethodDef __pyx_mdef_6gensim_6models_19word2vec_corpusfile_1rebuild_cython_line_sentence = {"rebuild_cython_line_sentence", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_19word2vec_corpusfile_1rebuild_cython_line_sentence, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_19word2vec_corpusfile_rebuild_cython_line_sentence}; static PyObject *__pyx_pw_6gensim_6models_19word2vec_corpusfile_1rebuild_cython_line_sentence(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_source = 0; PyObject *__pyx_v_max_sentence_length = 0; @@ -3095,6 +3116,7 @@ static PyObject *__pyx_f_6gensim_6models_19word2vec_corpusfile_to_bytes(PyObject int __pyx_t_2; PyObject *__pyx_t_3 = NULL; PyObject *__pyx_t_4 = NULL; + PyObject *__pyx_t_5 = NULL; __Pyx_RefNannySetupContext("to_bytes", 0); /* "gensim/models/word2vec_corpusfile.pyx":70 @@ -3138,14 +3160,26 @@ static PyObject *__pyx_f_6gensim_6models_19word2vec_corpusfile_to_bytes(PyObject */ /*else*/ { __Pyx_XDECREF(__pyx_r); - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_key, __pyx_n_s_encode); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 73, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = __Pyx_PyObject_Call(__pyx_t_3, __pyx_tuple__3, NULL); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 73, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyObject_GetAttrStr(__pyx_v_key, __pyx_n_s_encode); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 73, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - if 
(!(likely(PyBytes_CheckExact(__pyx_t_4))||((__pyx_t_4) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "bytes", Py_TYPE(__pyx_t_4)->tp_name), 0))) __PYX_ERR(1, 73, __pyx_L1_error) - __pyx_r = ((PyObject*)__pyx_t_4); - __pyx_t_4 = 0; + __pyx_t_5 = NULL; + if (CYTHON_UNPACK_METHODS && likely(PyMethod_Check(__pyx_t_4))) { + __pyx_t_5 = PyMethod_GET_SELF(__pyx_t_4); + if (likely(__pyx_t_5)) { + PyObject* function = PyMethod_GET_FUNCTION(__pyx_t_4); + __Pyx_INCREF(__pyx_t_5); + __Pyx_INCREF(function); + __Pyx_DECREF_SET(__pyx_t_4, function); + } + } + __pyx_t_3 = (__pyx_t_5) ? __Pyx_PyObject_Call2Args(__pyx_t_4, __pyx_t_5, __pyx_n_s_utf8) : __Pyx_PyObject_CallOneArg(__pyx_t_4, __pyx_n_s_utf8); + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; + if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 73, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_3); + __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; + if (!(likely(PyBytes_CheckExact(__pyx_t_3))||((__pyx_t_3) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "bytes", Py_TYPE(__pyx_t_3)->tp_name), 0))) __PYX_ERR(1, 73, __pyx_L1_error) + __pyx_r = ((PyObject*)__pyx_t_3); + __pyx_t_3 = 0; goto __pyx_L0; } @@ -3161,6 +3195,7 @@ static PyObject *__pyx_f_6gensim_6models_19word2vec_corpusfile_to_bytes(PyObject __pyx_L1_error:; __Pyx_XDECREF(__pyx_t_3); __Pyx_XDECREF(__pyx_t_4); + __Pyx_XDECREF(__pyx_t_5); __Pyx_AddTraceback("gensim.models.word2vec_corpusfile.to_bytes", __pyx_clineno, __pyx_lineno, __pyx_filename); __pyx_r = 0; __pyx_L0:; @@ -4285,7 +4320,9 @@ static PyObject *__pyx_gb_6gensim_6models_19word2vec_corpusfile_18CythonLineSent __Pyx_AddTraceback("__iter__", __pyx_clineno, __pyx_lineno, __pyx_filename); __pyx_L0:; __Pyx_XDECREF(__pyx_r); __pyx_r = 0; + #if !CYTHON_USE_EXC_INFO_STACK __Pyx_Coroutine_ResetAndClearException(__pyx_generator); + #endif __pyx_generator->resume_label = -1; __Pyx_Coroutine_clear((PyObject*)__pyx_generator); __Pyx_RefNannyFinishContext(); @@ -4330,7 +4367,7 @@ static PyObject 
*__pyx_pf_6gensim_6models_19word2vec_corpusfile_18CythonLineSent * cpdef vector[vector[string]] next_batch(self) nogil except *: */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_rebuild_cython_line_sentence); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 132, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_rebuild_cython_line_sentence); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 132, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_2 = __Pyx_PyInt_FromSize_t(__pyx_v_self->max_sentence_length); if (unlikely(!__pyx_t_2)) __PYX_ERR(1, 132, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); @@ -5678,7 +5715,7 @@ static __pyx_t_6gensim_6models_19word2vec_corpusfile_REAL_t __pyx_f_6gensim_6mod /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_19word2vec_corpusfile_3train_epoch_sg(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char __pyx_doc_6gensim_6models_19word2vec_corpusfile_2train_epoch_sg[] = "train_epoch_sg(model, corpus_file, offset, _cython_vocab, _cur_epoch, _expected_examples, _expected_words, _work, _neu1, compute_loss)\nTrain Skipgram model for one epoch by training on an input stream. This function is used only in multistream mode.\n\n Called internally from :meth:`~gensim.models.word2vec.Word2Vec.train`.\n\n Parameters\n ----------\n model : :class:`~gensim.models.word2vec.Word2Vec`\n The Word2Vec model instance to train.\n input_stream : iterable of list of str\n The corpus used to train the model.\n _cur_epoch : int\n Current epoch number. 
Used for calculating and decaying learning rate.\n _work : np.ndarray\n Private working memory for each worker.\n _neu1 : np.ndarray\n Private working memory for each worker.\n compute_loss : bool\n Whether or not the training loss should be computed in this batch.\n\n Returns\n -------\n int\n Number of words in the vocabulary actually used for training (They already existed in the vocabulary\n and were not discarded by negative sampling).\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_19word2vec_corpusfile_3train_epoch_sg = {"train_epoch_sg", (PyCFunction)__pyx_pw_6gensim_6models_19word2vec_corpusfile_3train_epoch_sg, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_19word2vec_corpusfile_2train_epoch_sg}; +static PyMethodDef __pyx_mdef_6gensim_6models_19word2vec_corpusfile_3train_epoch_sg = {"train_epoch_sg", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_19word2vec_corpusfile_3train_epoch_sg, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_19word2vec_corpusfile_2train_epoch_sg}; static PyObject *__pyx_pw_6gensim_6models_19word2vec_corpusfile_3train_epoch_sg(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_model = 0; PyObject *__pyx_v_corpus_file = 0; @@ -6499,7 +6536,7 @@ static PyObject *__pyx_pf_6gensim_6models_19word2vec_corpusfile_2train_epoch_sg( /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_19word2vec_corpusfile_5train_epoch_cbow(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char __pyx_doc_6gensim_6models_19word2vec_corpusfile_4train_epoch_cbow[] = "train_epoch_cbow(model, corpus_file, offset, _cython_vocab, _cur_epoch, _expected_examples, _expected_words, _work, _neu1, compute_loss)\nTrain CBOW model for one epoch by training on an input stream. 
This function is used only in multistream mode.\n\n Called internally from :meth:`~gensim.models.word2vec.Word2Vec.train`.\n\n Parameters\n ----------\n model : :class:`~gensim.models.word2vec.Word2Vec`\n The Word2Vec model instance to train.\n input_stream : iterable of list of str\n The corpus used to train the model.\n _cur_epoch : int\n Current epoch number. Used for calculating and decaying learning rate.\n _work : np.ndarray\n Private working memory for each worker.\n _neu1 : np.ndarray\n Private working memory for each worker.\n compute_loss : bool\n Whether or not the training loss should be computed in this batch.\n\n Returns\n -------\n int\n Number of words in the vocabulary actually used for training (They already existed in the vocabulary\n and were not discarded by negative sampling).\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_19word2vec_corpusfile_5train_epoch_cbow = {"train_epoch_cbow", (PyCFunction)__pyx_pw_6gensim_6models_19word2vec_corpusfile_5train_epoch_cbow, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_19word2vec_corpusfile_4train_epoch_cbow}; +static PyMethodDef __pyx_mdef_6gensim_6models_19word2vec_corpusfile_5train_epoch_cbow = {"train_epoch_cbow", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_19word2vec_corpusfile_5train_epoch_cbow, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_19word2vec_corpusfile_4train_epoch_cbow}; static PyObject *__pyx_pw_6gensim_6models_19word2vec_corpusfile_5train_epoch_cbow(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_model = 0; PyObject *__pyx_v_corpus_file = 0; @@ -7256,7 +7293,7 @@ static PyObject *__pyx_pf_6gensim_6models_19word2vec_corpusfile_4train_epoch_cbo return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":215 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and 
__releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -7294,8 +7331,9 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P int __pyx_t_4; int __pyx_t_5; int __pyx_t_6; - PyObject *__pyx_t_7 = NULL; - char *__pyx_t_8; + PyArray_Descr *__pyx_t_7; + PyObject *__pyx_t_8 = NULL; + char *__pyx_t_9; if (__pyx_v_info == NULL) { PyErr_SetString(PyExc_BufferError, "PyObject_GetBuffer: view==NULL argument is obsolete"); return -1; @@ -7304,7 +7342,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":222 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -7313,7 +7351,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":223 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -7322,7 +7360,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":225 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -7331,11 +7369,11 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ 
__pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":227 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") */ __pyx_t_2 = (((__pyx_v_flags & PyBUF_C_CONTIGUOUS) == PyBUF_C_CONTIGUOUS) != 0); @@ -7345,53 +7383,53 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":228 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< * raise ValueError(u"ndarray is not C contiguous") * */ - __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_C_CONTIGUOUS) != 0)) != 0); + __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_ARRAY_C_CONTIGUOUS) != 0)) != 0); __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":227 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") */ if (unlikely(__pyx_t_1)) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":229 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__4, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 229, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__3, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 272, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(3, 229, __pyx_L1_error) + __PYX_ERR(3, 272, __pyx_L1_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":227 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":231 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") */ __pyx_t_2 = (((__pyx_v_flags & PyBUF_F_CONTIGUOUS) == PyBUF_F_CONTIGUOUS) != 0); @@ -7401,49 +7439,49 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":232 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< * raise ValueError(u"ndarray is not Fortran contiguous") * */ - __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_F_CONTIGUOUS) != 0)) != 0); + __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_ARRAY_F_CONTIGUOUS) != 0)) != 0); __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":231 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") */ if (unlikely(__pyx_t_1)) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":233 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< * * info.buf = PyArray_DATA(self) */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__5, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 233, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, 
__pyx_tuple__4, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 276, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(3, 233, __pyx_L1_error) + __PYX_ERR(3, 276, __pyx_L1_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":231 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":235 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -7452,7 +7490,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":236 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -7461,7 +7499,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":237 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -7471,7 +7509,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = 
(((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":240 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -7480,7 +7518,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":241 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -7489,7 +7527,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":242 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -7501,7 +7539,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":243 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -7510,7 +7548,7 @@ 
static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":244 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -7520,7 +7558,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":237 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -7530,7 +7568,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":246 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -7540,7 +7578,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":247 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -7551,7 +7589,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* 
"../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":248 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -7560,7 +7598,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":249 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -7569,7 +7607,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = PyArray_ITEMSIZE(__pyx_v_self); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":250 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -7578,28 +7616,29 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":253 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< - * cdef dtype descr = self.descr + * cdef dtype descr = PyArray_DESCR(self) * cdef int offset */ __pyx_v_f = NULL; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":254 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL - * cdef dtype descr = self.descr # <<<<<<<<<<<<<< 
+ * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< * cdef int offset * */ - __pyx_t_3 = ((PyObject *)__pyx_v_self->descr); + __pyx_t_7 = PyArray_DESCR(__pyx_v_self); + __pyx_t_3 = ((PyObject *)__pyx_t_7); __Pyx_INCREF(__pyx_t_3); __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":257 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -7612,7 +7651,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); __pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":259 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -7622,7 +7661,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":260 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -7632,7 +7671,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":261 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7652,7 +7691,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } 
__pyx_L15_next_or:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":262 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -7669,7 +7708,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":261 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7678,20 +7717,20 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":263 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__6, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 263, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__5, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 306, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(3, 263, __pyx_L1_error) + __PYX_ERR(3, 306, __pyx_L1_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":261 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -7700,7 +7739,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":264 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -7711,206 +7750,206 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P case NPY_BYTE: __pyx_v_f = ((char *)"b"); break; + case NPY_UBYTE: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" */ - case NPY_UBYTE: __pyx_v_f = ((char *)"B"); break; + case NPY_SHORT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" */ - case NPY_SHORT: __pyx_v_f = ((char *)"h"); break; + case NPY_USHORT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":267 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # 
<<<<<<<<<<<<<< * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" */ - case NPY_USHORT: __pyx_v_f = ((char *)"H"); break; + case NPY_INT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" */ - case NPY_INT: __pyx_v_f = ((char *)"i"); break; + case NPY_UINT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":269 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" # <<<<<<<<<<<<<< * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" */ - case NPY_UINT: __pyx_v_f = ((char *)"I"); break; + case NPY_LONG: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" */ - case NPY_LONG: __pyx_v_f = ((char *)"l"); break; + case NPY_ULONG: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" */ - case NPY_ULONG: __pyx_v_f = ((char *)"L"); break; + case NPY_LONGLONG: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" */ - case NPY_LONGLONG: __pyx_v_f = ((char *)"q"); break; + case NPY_ULONGLONG: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":273 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" */ - case NPY_ULONGLONG: __pyx_v_f = ((char *)"Q"); break; + case NPY_FLOAT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" */ - case NPY_FLOAT: __pyx_v_f = ((char *)"f"); break; + case NPY_DOUBLE: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" */ - case NPY_DOUBLE: __pyx_v_f = ((char *)"d"); break; + case NPY_LONGDOUBLE: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< * elif t == NPY_CFLOAT: f = "Zf" * 
elif t == NPY_CDOUBLE: f = "Zd" */ - case NPY_LONGDOUBLE: __pyx_v_f = ((char *)"g"); break; + case NPY_CFLOAT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":277 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" */ - case NPY_CFLOAT: __pyx_v_f = ((char *)"Zf"); break; + case NPY_CDOUBLE: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" */ - case NPY_CDOUBLE: __pyx_v_f = ((char *)"Zd"); break; + case NPY_CLONGDOUBLE: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< * elif t == NPY_OBJECT: f = "O" * else: */ - case NPY_CLONGDOUBLE: __pyx_v_f = ((char *)"Zg"); break; + case NPY_OBJECT: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) */ - case NPY_OBJECT: __pyx_v_f = ((char *)"O"); break; default: - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":282 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< * info.format = f * return */ - __pyx_t_3 = __Pyx_PyInt_From_int(__pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 282, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_int(__pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 325, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_7 = PyUnicode_Format(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_t_3); if (unlikely(!__pyx_t_7)) __PYX_ERR(3, 282, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_7); + __pyx_t_8 = PyUnicode_Format(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_t_3); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 325, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_8); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_3 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_7); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 282, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_8); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 325, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(3, 282, __pyx_L1_error) + __PYX_ERR(3, 325, __pyx_L1_error) break; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -7919,7 +7958,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -7929,7 +7968,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":259 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -7938,7 +7977,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -7948,7 +7987,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment # <<<<<<<<<<<<<< @@ -7957,7 +7996,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":288 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -7966,17 +8005,17 @@ static int 
__pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< * info.format + _buffer_format_string_len, * &offset) */ - __pyx_t_8 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_8 == ((char *)NULL))) __PYX_ERR(3, 289, __pyx_L1_error) - __pyx_v_f = __pyx_t_8; + __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(3, 332, __pyx_L1_error) + __pyx_v_f = __pyx_t_9; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -7986,7 +8025,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":215 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. 
* def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -7999,7 +8038,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L0; __pyx_L1_error:; __Pyx_XDECREF(__pyx_t_3); - __Pyx_XDECREF(__pyx_t_7); + __Pyx_XDECREF(__pyx_t_8); __Pyx_AddTraceback("numpy.ndarray.__getbuffer__", __pyx_clineno, __pyx_lineno, __pyx_filename); __pyx_r = -1; if (__pyx_v_info->obj != NULL) { @@ -8018,7 +8057,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":294 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -8042,7 +8081,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":295 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -8052,7 +8091,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -8061,7 +8100,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* 
"../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":295 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -8070,7 +8109,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8080,7 +8119,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":298 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -8089,7 +8128,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8098,7 +8137,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":294 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, 
Py_buffer* info): # <<<<<<<<<<<<<< @@ -8110,7 +8149,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":775 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -8124,7 +8163,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -8132,13 +8171,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ * cdef inline object PyArray_MultiIterNew2(a, b): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(1, ((void *)__pyx_v_a)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 776, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(1, ((void *)__pyx_v_a)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 822, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":775 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -8157,7 +8196,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * 
return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -8171,7 +8210,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -8179,13 +8218,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ * cdef inline object PyArray_MultiIterNew3(a, b, c): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(2, ((void *)__pyx_v_a), ((void *)__pyx_v_b)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 779, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(2, ((void *)__pyx_v_a), ((void *)__pyx_v_b)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 825, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -8204,7 +8243,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":781 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -8218,7 +8257,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; 
__Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":782 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -8226,13 +8265,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ * cdef inline object PyArray_MultiIterNew4(a, b, c, d): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(3, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 782, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(3, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 828, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":781 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -8251,7 +8290,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -8265,7 +8304,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -8273,13 +8312,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(4, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 785, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(4, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 831, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -8298,7 +8337,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":787 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -8312,7 +8351,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":788 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return 
PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -8320,13 +8359,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ * cdef inline tuple PyDataType_SHAPE(dtype d): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(5, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d), ((void *)__pyx_v_e)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 788, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(5, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d), ((void *)__pyx_v_e)); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 834, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":787 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -8345,7 +8384,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -8359,7 +8398,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -8369,7 +8408,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = 
(PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":792 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -8381,7 +8420,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -8390,7 +8429,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":794 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -8404,7 +8443,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -8419,7 +8458,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":796 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # 
<<<<<<<<<<<<<< @@ -8448,7 +8487,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -8457,7 +8496,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -8466,7 +8505,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -8475,21 +8514,21 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_v_descr->names == Py_None)) { PyErr_SetString(PyExc_TypeError, "'NoneType' object is not iterable"); - __PYX_ERR(3, 805, __pyx_L1_error) + __PYX_ERR(3, 851, __pyx_L1_error) } __pyx_t_1 = __pyx_v_descr->names; __Pyx_INCREF(__pyx_t_1); __pyx_t_2 = 0; for (;;) { if (__pyx_t_2 >= PyTuple_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_2); __Pyx_INCREF(__pyx_t_3); __pyx_t_2++; if (unlikely(0 < 0)) __PYX_ERR(3, 805, __pyx_L1_error) + __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_1, 
__pyx_t_2); __Pyx_INCREF(__pyx_t_3); __pyx_t_2++; if (unlikely(0 < 0)) __PYX_ERR(3, 851, __pyx_L1_error) #else - __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_2); __pyx_t_2++; if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 805, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_2); __pyx_t_2++; if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 851, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); #endif __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -8498,15 +8537,15 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_v_descr->fields == Py_None)) { PyErr_SetString(PyExc_TypeError, "'NoneType' object is not subscriptable"); - __PYX_ERR(3, 806, __pyx_L1_error) + __PYX_ERR(3, 852, __pyx_L1_error) } - __pyx_t_3 = __Pyx_PyDict_GetItem(__pyx_v_descr->fields, __pyx_v_childname); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 806, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyDict_GetItem(__pyx_v_descr->fields, __pyx_v_childname); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 852, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - if (!(likely(PyTuple_CheckExact(__pyx_t_3))||((__pyx_t_3) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "tuple", Py_TYPE(__pyx_t_3)->tp_name), 0))) __PYX_ERR(3, 806, __pyx_L1_error) + if (!(likely(PyTuple_CheckExact(__pyx_t_3))||((__pyx_t_3) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "tuple", Py_TYPE(__pyx_t_3)->tp_name), 0))) __PYX_ERR(3, 852, __pyx_L1_error) __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":807 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -8519,7 +8558,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx if (unlikely(size != 2)) { if (size > 2) __Pyx_RaiseTooManyValuesError(2); else if (size >= 0) __Pyx_RaiseNeedMoreValuesError(size); - __PYX_ERR(3, 807, __pyx_L1_error) + __PYX_ERR(3, 853, __pyx_L1_error) } #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS __pyx_t_3 = PyTuple_GET_ITEM(sequence, 0); @@ -8527,51 +8566,51 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_INCREF(__pyx_t_3); __Pyx_INCREF(__pyx_t_4); #else - __pyx_t_3 = PySequence_ITEM(sequence, 0); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 807, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(sequence, 0); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 853, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PySequence_ITEM(sequence, 1); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 807, __pyx_L1_error) + __pyx_t_4 = PySequence_ITEM(sequence, 1); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 853, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); #endif } else { - __Pyx_RaiseNoneNotIterableError(); __PYX_ERR(3, 807, __pyx_L1_error) + __Pyx_RaiseNoneNotIterableError(); __PYX_ERR(3, 853, __pyx_L1_error) } - if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_dtype))))) __PYX_ERR(3, 807, __pyx_L1_error) + if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_dtype))))) __PYX_ERR(3, 853, __pyx_L1_error) __Pyx_XDECREF_SET(__pyx_v_child, ((PyArray_Descr *)__pyx_t_3)); __pyx_t_3 = 0; __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * */ - __pyx_t_4 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 809, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 855, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyNumber_Subtract(__pyx_v_new_offset, __pyx_t_4); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 809, __pyx_L1_error) + __pyx_t_3 = PyNumber_Subtract(__pyx_v_new_offset, __pyx_t_4); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 855, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_5 = __Pyx_PyInt_As_int(__pyx_t_3); if (unlikely((__pyx_t_5 == (int)-1) && PyErr_Occurred())) __PYX_ERR(3, 809, __pyx_L1_error) + __pyx_t_5 = __Pyx_PyInt_As_int(__pyx_t_3); if (unlikely((__pyx_t_5 == (int)-1) && PyErr_Occurred())) __PYX_ERR(3, 855, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":810 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< * * if ((child.byteorder == c'>' and little_endian) or */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__7, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 810, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__6, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 856, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); 
__Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(3, 810, __pyx_L1_error) + __PYX_ERR(3, 856, __pyx_L1_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -8580,7 +8619,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8600,7 +8639,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -8617,7 +8656,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8626,20 +8665,20 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":814 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< * # One could encode it in the format string and have Cython * # complain instead, BUT: < and > in format strings also imply */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__8, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 814, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__5, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 860, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(3, 814, __pyx_L1_error) + __PYX_ERR(3, 860, __pyx_L1_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8648,7 +8687,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -8656,15 +8695,15 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx * f += 1 */ while (1) { - __pyx_t_3 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 824, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 870, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_t_3, 
__pyx_v_new_offset, Py_LT); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 824, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_t_3, __pyx_v_new_offset, Py_LT); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 870, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 824, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 870, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -8673,7 +8712,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":826 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -8682,7 +8721,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -8693,7 +8732,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":829 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -8703,7 +8742,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -8713,19 +8752,19 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":832 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = child.type_num # <<<<<<<<<<<<<< * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") */ - __pyx_t_4 = __Pyx_PyInt_From_int(__pyx_v_child->type_num); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 832, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_int(__pyx_v_child->type_num); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 878, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -8735,20 +8774,20 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* 
"../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< * * # Until ticket #99 is fixed, use integers to avoid warnings */ - __pyx_t_4 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__9, NULL); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 834, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__7, NULL); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 880, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); __Pyx_Raise(__pyx_t_4, 0, 0, 0); __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __PYX_ERR(3, 834, __pyx_L1_error) + __PYX_ERR(3, 880, __pyx_L1_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -8757,252 +8796,252 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_BYTE); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 837, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_BYTE); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 883, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 837, __pyx_L1_error) + 
__pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 883, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 837, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 883, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 98; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UBYTE); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 838, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UBYTE); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 884, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 838, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 884, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 838, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 884, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 66; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":839 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_SHORT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 839, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_SHORT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 885, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 839, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 885, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 839, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 885, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x68; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_USHORT); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 840, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_USHORT); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 886, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) 
__PYX_ERR(3, 840, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 886, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 840, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 886, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 72; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":841 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" # <<<<<<<<<<<<<< * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_INT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 841, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_INT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 887, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 841, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 887, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 841, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 887, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x69; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UINT); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 842, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UINT); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 888, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 842, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 888, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 842, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 888, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 73; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":843 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 843, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 889, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) 
__PYX_ERR(3, 843, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 889, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 843, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 889, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x6C; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":844 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 844, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 890, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 844, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 890, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 844, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 890, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 76; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":845 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGLONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 845, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGLONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 891, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 845, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 891, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 845, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 891, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x71; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":846 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONGLONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 846, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONGLONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 892, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); 
__Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 846, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 892, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 846, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 892, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 81; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_FLOAT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 847, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_FLOAT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 893, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 847, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 893, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 847, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 893, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x66; goto __pyx_L15; } - /* 
"../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_DOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 848, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_DOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 894, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 848, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 894, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 848, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 894, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x64; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":849 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 849, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGDOUBLE); if 
(unlikely(!__pyx_t_4)) __PYX_ERR(3, 895, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 849, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 895, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 849, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 895, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x67; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":850 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CFLOAT); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 850, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CFLOAT); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 896, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 850, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 896, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 850, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if 
(unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 896, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 90; @@ -9011,18 +9050,18 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 851, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 897, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 851, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 897, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 851, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 897, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 90; @@ -9031,18 +9070,18 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf 
* elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CLONGDOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 852, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CLONGDOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 898, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 852, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 898, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 852, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 898, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 90; @@ -9051,25 +9090,25 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_OBJECT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 853, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_OBJECT); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 899, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); 
__Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 853, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 899, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 853, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(3, 899, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (likely(__pyx_t_6)) { (__pyx_v_f[0]) = 79; goto __pyx_L15; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ -9077,18 +9116,18 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx * else: */ /*else*/ { - __pyx_t_3 = PyUnicode_Format(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 855, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyUnicode_FormatSafe(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(3, 901, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_3); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 855, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_3); if (unlikely(!__pyx_t_4)) __PYX_ERR(3, 901, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __Pyx_Raise(__pyx_t_4, 0, 0, 0); __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __PYX_ERR(3, 855, __pyx_L1_error) + __PYX_ERR(3, 901, __pyx_L1_error) } __pyx_L15:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -9097,7 +9136,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -9107,7 +9146,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -9115,12 +9154,12 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx * */ /*else*/ { - __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_child, __pyx_v_f, __pyx_v_end, __pyx_v_offset); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(3, 860, __pyx_L1_error) + __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_child, __pyx_v_f, __pyx_v_end, __pyx_v_offset); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(3, 906, __pyx_L1_error) __pyx_v_f = __pyx_t_9; } __pyx_L13:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -9130,7 +9169,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* 
"../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":861 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -9140,7 +9179,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":796 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -9165,166 +9204,120 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":977 - * +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< - * cdef PyObject* baseptr - * if base is None: + * Py_INCREF(base) # important to do this before stealing the reference below! 
+ * PyArray_SetBaseObject(arr, base) */ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_arr, PyObject *__pyx_v_base) { - PyObject *__pyx_v_baseptr; __Pyx_RefNannyDeclarations - int __pyx_t_1; - int __pyx_t_2; __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":979 - * cdef inline void set_array_base(ndarray arr, object base): - * cdef PyObject* baseptr - * if base is None: # <<<<<<<<<<<<<< - * baseptr = NULL - * else: - */ - __pyx_t_1 = (__pyx_v_base == Py_None); - __pyx_t_2 = (__pyx_t_1 != 0); - if (__pyx_t_2) { - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":980 - * cdef PyObject* baseptr - * if base is None: - * baseptr = NULL # <<<<<<<<<<<<<< - * else: - * Py_INCREF(base) # important to do this before decref below! - */ - __pyx_v_baseptr = NULL; - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":979 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + * * cdef inline void set_array_base(ndarray arr, object base): - * cdef PyObject* baseptr - * if base is None: # <<<<<<<<<<<<<< - * baseptr = NULL - * else: - */ - goto __pyx_L3; - } - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":982 - * baseptr = NULL - * else: - * Py_INCREF(base) # important to do this before decref below! # <<<<<<<<<<<<<< - * baseptr = base - * Py_XDECREF(arr.base) - */ - /*else*/ { - Py_INCREF(__pyx_v_base); - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":983 - * else: - * Py_INCREF(base) # important to do this before decref below! 
- * baseptr = base # <<<<<<<<<<<<<< - * Py_XDECREF(arr.base) - * arr.base = baseptr - */ - __pyx_v_baseptr = ((PyObject *)__pyx_v_base); - } - __pyx_L3:; - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":984 - * Py_INCREF(base) # important to do this before decref below! - * baseptr = base - * Py_XDECREF(arr.base) # <<<<<<<<<<<<<< - * arr.base = baseptr + * Py_INCREF(base) # important to do this before stealing the reference below! # <<<<<<<<<<<<<< + * PyArray_SetBaseObject(arr, base) * */ - Py_XDECREF(__pyx_v_arr->base); + Py_INCREF(__pyx_v_base); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":985 - * baseptr = base - * Py_XDECREF(arr.base) - * arr.base = baseptr # <<<<<<<<<<<<<< + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + * cdef inline void set_array_base(ndarray arr, object base): + * Py_INCREF(base) # important to do this before stealing the reference below! + * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< * * cdef inline object get_array_base(ndarray arr): */ - __pyx_v_arr->base = __pyx_v_baseptr; + (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":977 - * + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< - * cdef PyObject* baseptr - * if base is None: + * Py_INCREF(base) # important to do this before stealing the reference below! 
+ * PyArray_SetBaseObject(arr, base) */ /* function exit code */ __Pyx_RefNannyFinishContext(); } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":987 - * arr.base = baseptr +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< - * if arr.base is NULL: - * return None + * base = PyArray_BASE(arr) + * if base is NULL: */ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__pyx_v_arr) { + PyObject *__pyx_v_base; PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":988 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): - * if arr.base is NULL: # <<<<<<<<<<<<<< + * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< + * if base is NULL: * return None - * else: */ - __pyx_t_1 = ((__pyx_v_arr->base == NULL) != 0); - if (__pyx_t_1) { + __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":989 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): - * if arr.base is NULL: + * base = PyArray_BASE(arr) + * if base is NULL: # <<<<<<<<<<<<<< + * return None + * return base + */ + __pyx_t_1 = ((__pyx_v_base == NULL) != 0); + if (__pyx_t_1) { + + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + * base = PyArray_BASE(arr) + * if base is NULL: * return None # <<<<<<<<<<<<<< - * else: - * return arr.base + * return base + * */ __Pyx_XDECREF(__pyx_r); __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* 
"../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":988 - * + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): - * if arr.base is NULL: # <<<<<<<<<<<<<< + * base = PyArray_BASE(arr) + * if base is NULL: # <<<<<<<<<<<<<< * return None - * else: + * return base */ } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":991 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + * if base is NULL: * return None - * else: - * return arr.base # <<<<<<<<<<<<<< - * + * return base # <<<<<<<<<<<<<< * + * # Versions of the import_* functions which are more suitable for */ - /*else*/ { - __Pyx_XDECREF(__pyx_r); - __Pyx_INCREF(((PyObject *)__pyx_v_arr->base)); - __pyx_r = ((PyObject *)__pyx_v_arr->base); - goto __pyx_L0; - } + __Pyx_XDECREF(__pyx_r); + __Pyx_INCREF(((PyObject *)__pyx_v_base)); + __pyx_r = ((PyObject *)__pyx_v_base); + goto __pyx_L0; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":987 - * arr.base = baseptr + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< - * if arr.base is NULL: - * return None + * base = PyArray_BASE(arr) + * if base is NULL: */ /* function exit code */ @@ -9334,7 +9327,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":996 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. 
* cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -9355,7 +9348,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":997 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -9371,16 +9364,16 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":998 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< * except Exception: * raise ImportError("numpy.core.multiarray failed to import") */ - __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(3, 998, __pyx_L3_error) + __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(3, 1036, __pyx_L3_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":997 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -9394,7 +9387,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":999 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -9404,28 +9397,28 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_t_4 = __Pyx_PyErr_ExceptionMatches(((PyObject *)(&((PyTypeObject*)PyExc_Exception)[0]))); if (__pyx_t_4) { __Pyx_AddTraceback("numpy.import_array", __pyx_clineno, __pyx_lineno, __pyx_filename); - if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(3, 999, __pyx_L5_except_error) + if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(3, 1037, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_5); __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1000 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_umath() except -1: */ - __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__10, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 1000, __pyx_L5_except_error) + __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__8, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 1038, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_Raise(__pyx_t_8, 0, 0, 0); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __PYX_ERR(3, 1000, __pyx_L5_except_error) + __PYX_ERR(3, 1038, __pyx_L5_except_error) } goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":997 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -9440,7 +9433,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":996 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -9463,7 +9456,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1002 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -9484,7 +9477,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1003 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -9500,16 +9493,16 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1004 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< * except Exception: * raise ImportError("numpy.core.umath failed to import") */ - __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(3, 1004, __pyx_L3_error) + 
__pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(3, 1042, __pyx_L3_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1003 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -9523,7 +9516,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1005 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -9533,28 +9526,28 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_t_4 = __Pyx_PyErr_ExceptionMatches(((PyObject *)(&((PyTypeObject*)PyExc_Exception)[0]))); if (__pyx_t_4) { __Pyx_AddTraceback("numpy.import_umath", __pyx_clineno, __pyx_lineno, __pyx_filename); - if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(3, 1005, __pyx_L5_except_error) + if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(3, 1043, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_5); __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1006 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_ufunc() except -1: */ - __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__11, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 1006, __pyx_L5_except_error) + __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__9, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 1044, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_Raise(__pyx_t_8, 0, 
0, 0); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __PYX_ERR(3, 1006, __pyx_L5_except_error) + __PYX_ERR(3, 1044, __pyx_L5_except_error) } goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1003 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -9569,7 +9562,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1002 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -9592,7 +9585,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1008 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -9613,7 +9606,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1009 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -9629,16 +9622,16 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1010 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int 
import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< * except Exception: * raise ImportError("numpy.core.umath failed to import") */ - __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(3, 1010, __pyx_L3_error) + __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(3, 1048, __pyx_L3_error) - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1009 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -9652,7 +9645,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1011 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -9661,26 +9654,26 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_t_4 = __Pyx_PyErr_ExceptionMatches(((PyObject *)(&((PyTypeObject*)PyExc_Exception)[0]))); if (__pyx_t_4) { __Pyx_AddTraceback("numpy.import_ufunc", __pyx_clineno, __pyx_lineno, __pyx_filename); - if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(3, 1011, __pyx_L5_except_error) + if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(3, 1049, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_5); __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1012 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< */ - __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__12, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 1012, 
__pyx_L5_except_error) + __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__9, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(3, 1050, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_Raise(__pyx_t_8, 0, 0, 0); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __PYX_ERR(3, 1012, __pyx_L5_except_error) + __PYX_ERR(3, 1050, __pyx_L5_except_error) } goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1009 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -9695,7 +9688,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1008 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -10645,10 +10638,21 @@ static struct PyModuleDef __pyx_moduledef = { NULL /* m_free */ }; #endif +#ifndef CYTHON_SMALL_CODE +#if defined(__clang__) + #define CYTHON_SMALL_CODE +#elif defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 3)) + #define CYTHON_SMALL_CODE __attribute__((cold)) +#else + #define CYTHON_SMALL_CODE +#endif +#endif static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_CORPUSFILE_VERSION, __pyx_k_CORPUSFILE_VERSION, sizeof(__pyx_k_CORPUSFILE_VERSION), 0, 0, 1, 1}, + {&__pyx_n_s_CythonLineSentence, __pyx_k_CythonLineSentence, sizeof(__pyx_k_CythonLineSentence), 0, 0, 1, 1}, {&__pyx_n_s_CythonLineSentence___iter, __pyx_k_CythonLineSentence___iter, sizeof(__pyx_k_CythonLineSentence___iter), 0, 0, 1, 1}, + {&__pyx_n_s_CythonVocab, __pyx_k_CythonVocab, sizeof(__pyx_k_CythonVocab), 0, 0, 1, 1}, {&__pyx_kp_u_Format_string_allocated_too_shor, 
__pyx_k_Format_string_allocated_too_shor, sizeof(__pyx_k_Format_string_allocated_too_shor), 0, 1, 0, 0}, {&__pyx_kp_u_Format_string_allocated_too_shor_2, __pyx_k_Format_string_allocated_too_shor_2, sizeof(__pyx_k_Format_string_allocated_too_shor_2), 0, 1, 0, 0}, {&__pyx_n_s_ImportError, __pyx_k_ImportError, sizeof(__pyx_k_ImportError), 0, 0, 1, 1}, @@ -10742,18 +10746,18 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_wv, __pyx_k_wv, sizeof(__pyx_k_wv), 0, 0, 1, 1}, {0, 0, 0, 0, 0, 0, 0} }; -static int __Pyx_InitCachedBuiltins(void) { +static CYTHON_SMALL_CODE int __Pyx_InitCachedBuiltins(void) { __pyx_builtin_TypeError = __Pyx_GetBuiltinName(__pyx_n_s_TypeError); if (!__pyx_builtin_TypeError) __PYX_ERR(0, 2, __pyx_L1_error) __pyx_builtin_range = __Pyx_GetBuiltinName(__pyx_n_s_range); if (!__pyx_builtin_range) __PYX_ERR(1, 109, __pyx_L1_error) - __pyx_builtin_ValueError = __Pyx_GetBuiltinName(__pyx_n_s_ValueError); if (!__pyx_builtin_ValueError) __PYX_ERR(3, 229, __pyx_L1_error) - __pyx_builtin_RuntimeError = __Pyx_GetBuiltinName(__pyx_n_s_RuntimeError); if (!__pyx_builtin_RuntimeError) __PYX_ERR(3, 810, __pyx_L1_error) - __pyx_builtin_ImportError = __Pyx_GetBuiltinName(__pyx_n_s_ImportError); if (!__pyx_builtin_ImportError) __PYX_ERR(3, 1000, __pyx_L1_error) + __pyx_builtin_ValueError = __Pyx_GetBuiltinName(__pyx_n_s_ValueError); if (!__pyx_builtin_ValueError) __PYX_ERR(3, 272, __pyx_L1_error) + __pyx_builtin_RuntimeError = __Pyx_GetBuiltinName(__pyx_n_s_RuntimeError); if (!__pyx_builtin_RuntimeError) __PYX_ERR(3, 856, __pyx_L1_error) + __pyx_builtin_ImportError = __Pyx_GetBuiltinName(__pyx_n_s_ImportError); if (!__pyx_builtin_ImportError) __PYX_ERR(3, 1038, __pyx_L1_error) return 0; __pyx_L1_error:; return -1; } -static int __Pyx_InitCachedConstants(void) { +static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("__Pyx_InitCachedConstants", 0); @@ -10776,113 +10780,82 @@ static int 
__Pyx_InitCachedConstants(void) { __Pyx_GOTREF(__pyx_tuple__2); __Pyx_GIVEREF(__pyx_tuple__2); - /* "gensim/models/word2vec_corpusfile.pyx":73 - * return key - * else: - * return key.encode('utf8') # <<<<<<<<<<<<<< - * - * - */ - __pyx_tuple__3 = PyTuple_Pack(1, __pyx_n_s_utf8); if (unlikely(!__pyx_tuple__3)) __PYX_ERR(1, 73, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__3); - __Pyx_GIVEREF(__pyx_tuple__3); - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":229 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) */ - __pyx_tuple__4 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_C_contiguous); if (unlikely(!__pyx_tuple__4)) __PYX_ERR(3, 229, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__4); - __Pyx_GIVEREF(__pyx_tuple__4); + __pyx_tuple__3 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_C_contiguous); if (unlikely(!__pyx_tuple__3)) __PYX_ERR(3, 272, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__3); + __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":233 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< * * info.buf = PyArray_DATA(self) */ - __pyx_tuple__5 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_Fortran_contiguou); if (unlikely(!__pyx_tuple__5)) __PYX_ERR(3, 233, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__5); - 
__Pyx_GIVEREF(__pyx_tuple__5); + __pyx_tuple__4 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_Fortran_contiguou); if (unlikely(!__pyx_tuple__4)) __PYX_ERR(3, 276, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__4); + __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":263 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" */ - __pyx_tuple__6 = PyTuple_Pack(1, __pyx_kp_u_Non_native_byte_order_not_suppor); if (unlikely(!__pyx_tuple__6)) __PYX_ERR(3, 263, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__6); - __Pyx_GIVEREF(__pyx_tuple__6); + __pyx_tuple__5 = PyTuple_Pack(1, __pyx_kp_u_Non_native_byte_order_not_suppor); if (unlikely(!__pyx_tuple__5)) __PYX_ERR(3, 306, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__5); + __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":810 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< * * if ((child.byteorder == c'>' and little_endian) or */ - __pyx_tuple__7 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor); if (unlikely(!__pyx_tuple__7)) __PYX_ERR(3, 810, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__7); - __Pyx_GIVEREF(__pyx_tuple__7); - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":814 - * if ((child.byteorder == c'>' and little_endian) or - * (child.byteorder == c'<' and not little_endian)): - * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< - * # One could encode it in 
the format string and have Cython - * # complain instead, BUT: < and > in format strings also imply - */ - __pyx_tuple__8 = PyTuple_Pack(1, __pyx_kp_u_Non_native_byte_order_not_suppor); if (unlikely(!__pyx_tuple__8)) __PYX_ERR(3, 814, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__8); - __Pyx_GIVEREF(__pyx_tuple__8); + __pyx_tuple__6 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor); if (unlikely(!__pyx_tuple__6)) __PYX_ERR(3, 856, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__6); + __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< * * # Until ticket #99 is fixed, use integers to avoid warnings */ - __pyx_tuple__9 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor_2); if (unlikely(!__pyx_tuple__9)) __PYX_ERR(3, 834, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__9); - __Pyx_GIVEREF(__pyx_tuple__9); + __pyx_tuple__7 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor_2); if (unlikely(!__pyx_tuple__7)) __PYX_ERR(3, 880, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__7); + __Pyx_GIVEREF(__pyx_tuple__7); - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1000 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_umath() except -1: */ - __pyx_tuple__10 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_multiarray_failed_to); if (unlikely(!__pyx_tuple__10)) __PYX_ERR(3, 1000, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__10); - __Pyx_GIVEREF(__pyx_tuple__10); - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1006 + __pyx_tuple__8 = 
PyTuple_Pack(1, __pyx_kp_s_numpy_core_multiarray_failed_to); if (unlikely(!__pyx_tuple__8)) __PYX_ERR(3, 1038, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__8); + __Pyx_GIVEREF(__pyx_tuple__8); + + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_ufunc() except -1: */ - __pyx_tuple__11 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__11)) __PYX_ERR(3, 1006, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__11); - __Pyx_GIVEREF(__pyx_tuple__11); - - /* "../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1012 - * _import_umath() - * except Exception: - * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< - */ - __pyx_tuple__12 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__12)) __PYX_ERR(3, 1012, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__12); - __Pyx_GIVEREF(__pyx_tuple__12); + __pyx_tuple__9 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__9)) __PYX_ERR(3, 1044, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__9); + __Pyx_GIVEREF(__pyx_tuple__9); /* "gensim/models/word2vec_corpusfile.pyx":65 * @@ -10891,10 +10864,10 @@ static int __Pyx_InitCachedConstants(void) { * return CythonLineSentence(source, max_sentence_length=max_sentence_length) * */ - __pyx_tuple__13 = PyTuple_Pack(2, __pyx_n_s_source, __pyx_n_s_max_sentence_length); if (unlikely(!__pyx_tuple__13)) __PYX_ERR(1, 65, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__13); - __Pyx_GIVEREF(__pyx_tuple__13); - __pyx_codeobj__14 = (PyObject*)__Pyx_PyCode_New(2, 0, 2, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__13, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_corpusfil_2, 
__pyx_n_s_rebuild_cython_line_sentence, 65, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__14)) __PYX_ERR(1, 65, __pyx_L1_error) + __pyx_tuple__10 = PyTuple_Pack(2, __pyx_n_s_source, __pyx_n_s_max_sentence_length); if (unlikely(!__pyx_tuple__10)) __PYX_ERR(1, 65, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__10); + __Pyx_GIVEREF(__pyx_tuple__10); + __pyx_codeobj__11 = (PyObject*)__Pyx_PyCode_New(2, 0, 2, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__10, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_corpusfil_2, __pyx_n_s_rebuild_cython_line_sentence, 65, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__11)) __PYX_ERR(1, 65, __pyx_L1_error) /* "gensim/models/word2vec_corpusfile.pyx":249 * @@ -10903,10 +10876,10 @@ static int __Pyx_InitCachedConstants(void) { * _neu1, compute_loss): * """Train Skipgram model for one epoch by training on an input stream. This function is used only in multistream mode. */ - __pyx_tuple__15 = PyTuple_Pack(33, __pyx_n_s_model, __pyx_n_s_corpus_file, __pyx_n_s_offset, __pyx_n_s_cython_vocab, __pyx_n_s_cur_epoch, __pyx_n_s_expected_examples, __pyx_n_s_expected_words, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_cur_epoch_2, __pyx_n_s_num_epochs, __pyx_n_s_expected_examples_2, __pyx_n_s_expected_words_2, __pyx_n_s_start_alpha, __pyx_n_s_end_alpha, __pyx_n_s_alpha_2, __pyx_n_s_input_stream, __pyx_n_s_vocab, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_effective_samples, __pyx_n_s_total_effective_words, __pyx_n_s_total_sentences, __pyx_n_s_total_words, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_sentences); if (unlikely(!__pyx_tuple__15)) __PYX_ERR(1, 249, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__15); - __Pyx_GIVEREF(__pyx_tuple__15); - __pyx_codeobj__16 = (PyObject*)__Pyx_PyCode_New(10, 0, 33, 0, CO_OPTIMIZED|CO_NEWLOCALS, 
__pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__15, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_corpusfil_2, __pyx_n_s_train_epoch_sg, 249, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__16)) __PYX_ERR(1, 249, __pyx_L1_error) + __pyx_tuple__12 = PyTuple_Pack(33, __pyx_n_s_model, __pyx_n_s_corpus_file, __pyx_n_s_offset, __pyx_n_s_cython_vocab, __pyx_n_s_cur_epoch, __pyx_n_s_expected_examples, __pyx_n_s_expected_words, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_cur_epoch_2, __pyx_n_s_num_epochs, __pyx_n_s_expected_examples_2, __pyx_n_s_expected_words_2, __pyx_n_s_start_alpha, __pyx_n_s_end_alpha, __pyx_n_s_alpha_2, __pyx_n_s_input_stream, __pyx_n_s_vocab, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_effective_samples, __pyx_n_s_total_effective_words, __pyx_n_s_total_sentences, __pyx_n_s_total_words, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_sentences); if (unlikely(!__pyx_tuple__12)) __PYX_ERR(1, 249, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__12); + __Pyx_GIVEREF(__pyx_tuple__12); + __pyx_codeobj__13 = (PyObject*)__Pyx_PyCode_New(10, 0, 33, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__12, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_corpusfil_2, __pyx_n_s_train_epoch_sg, 249, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__13)) __PYX_ERR(1, 249, __pyx_L1_error) /* "gensim/models/word2vec_corpusfile.pyx":348 * @@ -10915,10 +10888,10 @@ static int __Pyx_InitCachedConstants(void) { * _neu1, compute_loss): * """Train CBOW model for one epoch by training on an input stream. This function is used only in multistream mode. 
*/ - __pyx_tuple__17 = PyTuple_Pack(32, __pyx_n_s_model, __pyx_n_s_corpus_file, __pyx_n_s_offset, __pyx_n_s_cython_vocab, __pyx_n_s_cur_epoch, __pyx_n_s_expected_examples, __pyx_n_s_expected_words, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_cur_epoch_2, __pyx_n_s_num_epochs, __pyx_n_s_expected_examples_2, __pyx_n_s_expected_words_2, __pyx_n_s_start_alpha, __pyx_n_s_end_alpha, __pyx_n_s_alpha_2, __pyx_n_s_input_stream, __pyx_n_s_vocab, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_total_sentences, __pyx_n_s_total_effective_words, __pyx_n_s_total_words, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_sentences); if (unlikely(!__pyx_tuple__17)) __PYX_ERR(1, 348, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__17); - __Pyx_GIVEREF(__pyx_tuple__17); - __pyx_codeobj__18 = (PyObject*)__Pyx_PyCode_New(10, 0, 32, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__17, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_corpusfil_2, __pyx_n_s_train_epoch_cbow, 348, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__18)) __PYX_ERR(1, 348, __pyx_L1_error) + __pyx_tuple__14 = PyTuple_Pack(32, __pyx_n_s_model, __pyx_n_s_corpus_file, __pyx_n_s_offset, __pyx_n_s_cython_vocab, __pyx_n_s_cur_epoch, __pyx_n_s_expected_examples, __pyx_n_s_expected_words, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_cur_epoch_2, __pyx_n_s_num_epochs, __pyx_n_s_expected_examples_2, __pyx_n_s_expected_words_2, __pyx_n_s_start_alpha, __pyx_n_s_end_alpha, __pyx_n_s_alpha_2, __pyx_n_s_input_stream, __pyx_n_s_vocab, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_total_sentences, __pyx_n_s_total_effective_words, __pyx_n_s_total_words, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_sentences); if 
(unlikely(!__pyx_tuple__14)) __PYX_ERR(1, 348, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__14); + __Pyx_GIVEREF(__pyx_tuple__14); + __pyx_codeobj__15 = (PyObject*)__Pyx_PyCode_New(10, 0, 32, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__14, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_corpusfil_2, __pyx_n_s_train_epoch_cbow, 348, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__15)) __PYX_ERR(1, 348, __pyx_L1_error) __Pyx_RefNannyFinishContext(); return 0; __pyx_L1_error:; @@ -10926,7 +10899,7 @@ static int __Pyx_InitCachedConstants(void) { return -1; } -static int __Pyx_InitGlobals(void) { +static CYTHON_SMALL_CODE int __Pyx_InitGlobals(void) { if (__Pyx_InitStrings(__pyx_string_tab) < 0) __PYX_ERR(1, 1, __pyx_L1_error); __pyx_int_0 = PyInt_FromLong(0); if (unlikely(!__pyx_int_0)) __PYX_ERR(1, 1, __pyx_L1_error) __pyx_int_1 = PyInt_FromLong(1); if (unlikely(!__pyx_int_1)) __PYX_ERR(1, 1, __pyx_L1_error) @@ -10936,13 +10909,13 @@ static int __Pyx_InitGlobals(void) { return -1; } -static int __Pyx_modinit_global_init_code(void); /*proto*/ -static int __Pyx_modinit_variable_export_code(void); /*proto*/ -static int __Pyx_modinit_function_export_code(void); /*proto*/ -static int __Pyx_modinit_type_init_code(void); /*proto*/ -static int __Pyx_modinit_type_import_code(void); /*proto*/ -static int __Pyx_modinit_variable_import_code(void); /*proto*/ -static int __Pyx_modinit_function_import_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_global_init_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_variable_export_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_function_export_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_type_init_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_type_import_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_variable_import_code(void); /*proto*/ +static 
CYTHON_SMALL_CODE int __Pyx_modinit_function_import_code(void); /*proto*/ static int __Pyx_modinit_global_init_code(void) { __Pyx_RefNannyDeclarations @@ -10990,7 +10963,7 @@ static int __Pyx_modinit_type_init_code(void) { __pyx_type_6gensim_6models_19word2vec_corpusfile_CythonLineSentence.tp_getattro = __Pyx_PyObject_GenericGetAttrNoDict; } if (__Pyx_SetVtable(__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonLineSentence.tp_dict, __pyx_vtabptr_6gensim_6models_19word2vec_corpusfile_CythonLineSentence) < 0) __PYX_ERR(1, 77, __pyx_L1_error) - if (PyObject_SetAttrString(__pyx_m, "CythonLineSentence", (PyObject *)&__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonLineSentence) < 0) __PYX_ERR(1, 77, __pyx_L1_error) + if (PyObject_SetAttr(__pyx_m, __pyx_n_s_CythonLineSentence, (PyObject *)&__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonLineSentence) < 0) __PYX_ERR(1, 77, __pyx_L1_error) __pyx_ptype_6gensim_6models_19word2vec_corpusfile_CythonLineSentence = &__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonLineSentence; __pyx_vtabptr_6gensim_6models_19word2vec_corpusfile_CythonVocab = &__pyx_vtable_6gensim_6models_19word2vec_corpusfile_CythonVocab; __pyx_vtable_6gensim_6models_19word2vec_corpusfile_CythonVocab.get_vocab_ptr = (__pyx_t_6gensim_6models_19word2vec_corpusfile_cvocab_t *(*)(struct __pyx_obj_6gensim_6models_19word2vec_corpusfile_CythonVocab *))__pyx_f_6gensim_6models_19word2vec_corpusfile_11CythonVocab_get_vocab_ptr; @@ -11000,7 +10973,7 @@ static int __Pyx_modinit_type_init_code(void) { __pyx_type_6gensim_6models_19word2vec_corpusfile_CythonVocab.tp_getattro = __Pyx_PyObject_GenericGetAttrNoDict; } if (__Pyx_SetVtable(__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonVocab.tp_dict, __pyx_vtabptr_6gensim_6models_19word2vec_corpusfile_CythonVocab) < 0) __PYX_ERR(1, 40, __pyx_L1_error) - if (PyObject_SetAttrString(__pyx_m, "CythonVocab", (PyObject *)&__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonVocab) < 0) __PYX_ERR(1, 40, 
__pyx_L1_error) + if (PyObject_SetAttr(__pyx_m, __pyx_n_s_CythonVocab, (PyObject *)&__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonVocab) < 0) __PYX_ERR(1, 40, __pyx_L1_error) if (__Pyx_setup_reduce((PyObject*)&__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonVocab) < 0) __PYX_ERR(1, 40, __pyx_L1_error) __pyx_ptype_6gensim_6models_19word2vec_corpusfile_CythonVocab = &__pyx_type_6gensim_6models_19word2vec_corpusfile_CythonVocab; if (PyType_Ready(&__pyx_type_6gensim_6models_19word2vec_corpusfile___pyx_scope_struct____iter__) < 0) __PYX_ERR(1, 122, __pyx_L1_error) @@ -11018,23 +10991,37 @@ static int __Pyx_modinit_type_init_code(void) { static int __Pyx_modinit_type_import_code(void) { __Pyx_RefNannyDeclarations + PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("__Pyx_modinit_type_import_code", 0); /*--- Type import code ---*/ - __pyx_ptype_7cpython_4type_type = __Pyx_ImportType(__Pyx_BUILTIN_MODULE_NAME, "type", + __pyx_t_1 = PyImport_ImportModule(__Pyx_BUILTIN_MODULE_NAME); if (unlikely(!__pyx_t_1)) __PYX_ERR(4, 9, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_ptype_7cpython_4type_type = __Pyx_ImportType(__pyx_t_1, __Pyx_BUILTIN_MODULE_NAME, "type", #if defined(PYPY_VERSION_NUM) && PYPY_VERSION_NUM < 0x050B0000 sizeof(PyTypeObject), #else sizeof(PyHeapTypeObject), #endif - 0); if (unlikely(!__pyx_ptype_7cpython_4type_type)) __PYX_ERR(4, 9, __pyx_L1_error) - __pyx_ptype_5numpy_dtype = __Pyx_ImportType("numpy", "dtype", sizeof(PyArray_Descr), 0); if (unlikely(!__pyx_ptype_5numpy_dtype)) __PYX_ERR(3, 164, __pyx_L1_error) - __pyx_ptype_5numpy_flatiter = __Pyx_ImportType("numpy", "flatiter", sizeof(PyArrayIterObject), 0); if (unlikely(!__pyx_ptype_5numpy_flatiter)) __PYX_ERR(3, 186, __pyx_L1_error) - __pyx_ptype_5numpy_broadcast = __Pyx_ImportType("numpy", "broadcast", sizeof(PyArrayMultiIterObject), 0); if (unlikely(!__pyx_ptype_5numpy_broadcast)) __PYX_ERR(3, 190, __pyx_L1_error) - __pyx_ptype_5numpy_ndarray = __Pyx_ImportType("numpy", 
"ndarray", sizeof(PyArrayObject), 0); if (unlikely(!__pyx_ptype_5numpy_ndarray)) __PYX_ERR(3, 199, __pyx_L1_error) - __pyx_ptype_5numpy_ufunc = __Pyx_ImportType("numpy", "ufunc", sizeof(PyUFuncObject), 0); if (unlikely(!__pyx_ptype_5numpy_ufunc)) __PYX_ERR(3, 872, __pyx_L1_error) + __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_7cpython_4type_type) __PYX_ERR(4, 9, __pyx_L1_error) + __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; + __pyx_t_1 = PyImport_ImportModule("numpy"); if (unlikely(!__pyx_t_1)) __PYX_ERR(3, 206, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_ptype_5numpy_dtype = __Pyx_ImportType(__pyx_t_1, "numpy", "dtype", sizeof(PyArray_Descr), __Pyx_ImportType_CheckSize_Ignore); + if (!__pyx_ptype_5numpy_dtype) __PYX_ERR(3, 206, __pyx_L1_error) + __pyx_ptype_5numpy_flatiter = __Pyx_ImportType(__pyx_t_1, "numpy", "flatiter", sizeof(PyArrayIterObject), __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_5numpy_flatiter) __PYX_ERR(3, 229, __pyx_L1_error) + __pyx_ptype_5numpy_broadcast = __Pyx_ImportType(__pyx_t_1, "numpy", "broadcast", sizeof(PyArrayMultiIterObject), __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_5numpy_broadcast) __PYX_ERR(3, 233, __pyx_L1_error) + __pyx_ptype_5numpy_ndarray = __Pyx_ImportType(__pyx_t_1, "numpy", "ndarray", sizeof(PyArrayObject), __Pyx_ImportType_CheckSize_Ignore); + if (!__pyx_ptype_5numpy_ndarray) __PYX_ERR(3, 242, __pyx_L1_error) + __pyx_ptype_5numpy_ufunc = __Pyx_ImportType(__pyx_t_1, "numpy", "ufunc", sizeof(PyUFuncObject), __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_5numpy_ufunc) __PYX_ERR(3, 918, __pyx_L1_error) + __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __Pyx_RefNannyFinishContext(); return 0; __pyx_L1_error:; + __Pyx_XDECREF(__pyx_t_1); __Pyx_RefNannyFinishContext(); return -1; } @@ -11044,7 +11031,7 @@ static int __Pyx_modinit_variable_import_code(void) { PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("__Pyx_modinit_variable_import_code", 0); /*--- Variable import code ---*/ - __pyx_t_1 = 
__Pyx_ImportModule("gensim.models.word2vec_inner"); if (!__pyx_t_1) __PYX_ERR(1, 1, __pyx_L1_error) + __pyx_t_1 = PyImport_ImportModule("gensim.models.word2vec_inner"); if (!__pyx_t_1) __PYX_ERR(1, 1, __pyx_L1_error) if (__Pyx_ImportVoidPtr(__pyx_t_1, "scopy", (void **)&__pyx_vp_6gensim_6models_14word2vec_inner_scopy, "__pyx_t_6gensim_6models_14word2vec_inner_scopy_ptr") < 0) __PYX_ERR(1, 1, __pyx_L1_error) if (__Pyx_ImportVoidPtr(__pyx_t_1, "saxpy", (void **)&__pyx_vp_6gensim_6models_14word2vec_inner_saxpy, "__pyx_t_6gensim_6models_14word2vec_inner_saxpy_ptr") < 0) __PYX_ERR(1, 1, __pyx_L1_error) if (__Pyx_ImportVoidPtr(__pyx_t_1, "sdot", (void **)&__pyx_vp_6gensim_6models_14word2vec_inner_sdot, "__pyx_t_6gensim_6models_14word2vec_inner_sdot_ptr") < 0) __PYX_ERR(1, 1, __pyx_L1_error) @@ -11068,7 +11055,7 @@ static int __Pyx_modinit_function_import_code(void) { PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("__Pyx_modinit_function_import_code", 0); /*--- Function import code ---*/ - __pyx_t_1 = __Pyx_ImportModule("gensim.models.word2vec_inner"); if (!__pyx_t_1) __PYX_ERR(1, 1, __pyx_L1_error) + __pyx_t_1 = PyImport_ImportModule("gensim.models.word2vec_inner"); if (!__pyx_t_1) __PYX_ERR(1, 1, __pyx_L1_error) if (__Pyx_ImportFunction(__pyx_t_1, "random_int32", (void (**)(void))&__pyx_f_6gensim_6models_14word2vec_inner_random_int32, "unsigned PY_LONG_LONG (unsigned PY_LONG_LONG *)") < 0) __PYX_ERR(1, 1, __pyx_L1_error) if (__Pyx_ImportFunction(__pyx_t_1, "w2v_fast_sentence_sg_hs", (void (**)(void))&__pyx_f_6gensim_6models_14word2vec_inner_w2v_fast_sentence_sg_hs, "void (__pyx_t_5numpy_uint32_t const *, __pyx_t_5numpy_uint8_t const *, int const , __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, int const , __pyx_t_5numpy_uint32_t const , __pyx_t_6gensim_6models_14word2vec_inner_REAL_t const , __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, int const , 
__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)") < 0) __PYX_ERR(1, 1, __pyx_L1_error) if (__Pyx_ImportFunction(__pyx_t_1, "w2v_fast_sentence_sg_neg", (void (**)(void))&__pyx_f_6gensim_6models_14word2vec_inner_w2v_fast_sentence_sg_neg, "unsigned PY_LONG_LONG (int const , __pyx_t_5numpy_uint32_t *, unsigned PY_LONG_LONG, __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, int const , __pyx_t_5numpy_uint32_t const , __pyx_t_5numpy_uint32_t const , __pyx_t_6gensim_6models_14word2vec_inner_REAL_t const , __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, unsigned PY_LONG_LONG, __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *, int const , __pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)") < 0) __PYX_ERR(1, 1, __pyx_L1_error) @@ -11098,15 +11085,6 @@ static int __Pyx_modinit_function_import_code(void) { #define __Pyx_PyMODINIT_FUNC PyMODINIT_FUNC #endif #endif -#ifndef CYTHON_SMALL_CODE -#if defined(__clang__) - #define CYTHON_SMALL_CODE -#elif defined(__GNUC__) && (!(defined(__cplusplus)) || (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ > 4))) - #define CYTHON_SMALL_CODE __attribute__((optimize("Os"))) -#else - #define CYTHON_SMALL_CODE -#endif -#endif #if PY_MAJOR_VERSION < 3 @@ -11119,11 +11097,36 @@ __Pyx_PyMODINIT_FUNC PyInit_word2vec_corpusfile(void) { return PyModuleDef_Init(&__pyx_moduledef); } -static int __Pyx_copy_spec_to_module(PyObject *spec, PyObject *moddict, const char* from_name, const char* to_name) { +static CYTHON_SMALL_CODE int __Pyx_check_single_interpreter(void) { + #if PY_VERSION_HEX >= 0x030700A1 + static PY_INT64_T main_interpreter_id = -1; + PY_INT64_T current_id = PyInterpreterState_GetID(PyThreadState_Get()->interp); + if (main_interpreter_id == -1) { + main_interpreter_id = current_id; + return (unlikely(current_id == -1)) ? 
-1 : 0; + } else if (unlikely(main_interpreter_id != current_id)) + #else + static PyInterpreterState *main_interpreter = NULL; + PyInterpreterState *current_interpreter = PyThreadState_Get()->interp; + if (!main_interpreter) { + main_interpreter = current_interpreter; + } else if (unlikely(main_interpreter != current_interpreter)) + #endif + { + PyErr_SetString( + PyExc_ImportError, + "Interpreter change detected - this module can only be loaded into one interpreter per process."); + return -1; + } + return 0; +} +static CYTHON_SMALL_CODE int __Pyx_copy_spec_to_module(PyObject *spec, PyObject *moddict, const char* from_name, const char* to_name, int allow_none) { PyObject *value = PyObject_GetAttrString(spec, from_name); int result = 0; if (likely(value)) { - result = PyDict_SetItemString(moddict, to_name, value); + if (allow_none || value != Py_None) { + result = PyDict_SetItemString(moddict, to_name, value); + } Py_DECREF(value); } else if (PyErr_ExceptionMatches(PyExc_AttributeError)) { PyErr_Clear(); @@ -11132,8 +11135,10 @@ static int __Pyx_copy_spec_to_module(PyObject *spec, PyObject *moddict, const ch } return result; } -static PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *def) { +static CYTHON_SMALL_CODE PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *def) { PyObject *module = NULL, *moddict, *modname; + if (__Pyx_check_single_interpreter()) + return NULL; if (__pyx_m) return __Pyx_NewRef(__pyx_m); modname = PyObject_GetAttrString(spec, "name"); @@ -11143,10 +11148,10 @@ static PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *d if (unlikely(!module)) goto bad; moddict = PyModule_GetDict(module); if (unlikely(!moddict)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "loader", "__loader__") < 0)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "origin", "__file__") < 0)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "parent", 
"__package__") < 0)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "submodule_search_locations", "__path__") < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "loader", "__loader__", 1) < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "origin", "__file__", 1) < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "parent", "__package__", 1) < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "submodule_search_locations", "__path__", 0) < 0)) goto bad; return module; bad: Py_XDECREF(module); @@ -11154,7 +11159,7 @@ static PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *d } -static int __pyx_pymod_exec_word2vec_corpusfile(PyObject *__pyx_pyinit_module) +static CYTHON_SMALL_CODE int __pyx_pymod_exec_word2vec_corpusfile(PyObject *__pyx_pyinit_module) #endif #endif { @@ -11162,7 +11167,11 @@ static int __pyx_pymod_exec_word2vec_corpusfile(PyObject *__pyx_pyinit_module) PyObject *__pyx_t_2 = NULL; __Pyx_RefNannyDeclarations #if CYTHON_PEP489_MULTI_PHASE_INIT - if (__pyx_m && __pyx_m == __pyx_pyinit_module) return 0; + if (__pyx_m) { + if (__pyx_m == __pyx_pyinit_module) return 0; + PyErr_SetString(PyExc_RuntimeError, "Module 'word2vec_corpusfile' has already been imported. 
Re-initialisation is not supported."); + return -1; + } #elif PY_MAJOR_VERSION >= 3 if (__pyx_m) return __Pyx_NewRef(__pyx_m); #endif @@ -11177,6 +11186,9 @@ if (!__Pyx_RefNanny) { #endif __Pyx_RefNannySetupContext("__Pyx_PyMODINIT_FUNC PyInit_word2vec_corpusfile(void)", 0); if (__Pyx_check_binary_version() < 0) __PYX_ERR(1, 1, __pyx_L1_error) + #ifdef __Pxy_PyFrame_Initialize_Offsets + __Pxy_PyFrame_Initialize_Offsets(); + #endif __pyx_empty_tuple = PyTuple_New(0); if (unlikely(!__pyx_empty_tuple)) __PYX_ERR(1, 1, __pyx_L1_error) __pyx_empty_bytes = PyBytes_FromStringAndSize("", 0); if (unlikely(!__pyx_empty_bytes)) __PYX_ERR(1, 1, __pyx_L1_error) __pyx_empty_unicode = PyUnicode_FromStringAndSize("", 0); if (unlikely(!__pyx_empty_unicode)) __PYX_ERR(1, 1, __pyx_L1_error) @@ -11231,7 +11243,7 @@ if (!__Pyx_RefNanny) { if (__Pyx_init_sys_getdefaultencoding_params() < 0) __PYX_ERR(1, 1, __pyx_L1_error) #endif if (__pyx_module_is_main_gensim__models__word2vec_corpusfile) { - if (PyObject_SetAttrString(__pyx_m, "__name__", __pyx_n_s_main) < 0) __PYX_ERR(1, 1, __pyx_L1_error) + if (PyObject_SetAttr(__pyx_m, __pyx_n_s_name, __pyx_n_s_main) < 0) __PYX_ERR(1, 1, __pyx_L1_error) } #if PY_MAJOR_VERSION >= 3 { @@ -11381,9 +11393,9 @@ if (!__Pyx_RefNanny) { __Pyx_XDECREF(__pyx_t_2); if (__pyx_m) { if (__pyx_d) { - __Pyx_AddTraceback("init gensim.models.word2vec_corpusfile", 0, __pyx_lineno, __pyx_filename); + __Pyx_AddTraceback("init gensim.models.word2vec_corpusfile", __pyx_clineno, __pyx_lineno, __pyx_filename); } - Py_DECREF(__pyx_m); __pyx_m = 0; + Py_CLEAR(__pyx_m); } else if (!PyErr_Occurred()) { PyErr_SetString(PyExc_ImportError, "init gensim.models.word2vec_corpusfile"); } @@ -11404,9 +11416,9 @@ if (!__Pyx_RefNanny) { static __Pyx_RefNannyAPIStruct *__Pyx_RefNannyImportAPI(const char *modname) { PyObject *m = NULL, *p = NULL; void *r = NULL; - m = PyImport_ImportModule((char *)modname); + m = PyImport_ImportModule(modname); if (!m) goto end; - p = 
PyObject_GetAttrString(m, (char *)"RefNannyAPI"); + p = PyObject_GetAttrString(m, "RefNannyAPI"); if (!p) goto end; r = PyLong_AsVoidPtr(p); end: @@ -11587,41 +11599,49 @@ static void __Pyx_RaiseArgtupleInvalid( } /* GetModuleGlobalName */ -static CYTHON_INLINE PyObject *__Pyx_GetModuleGlobalName(PyObject *name) { +#if CYTHON_USE_DICT_VERSIONS +static PyObject *__Pyx__GetModuleGlobalName(PyObject *name, PY_UINT64_T *dict_version, PyObject **dict_cached_value) +#else +static CYTHON_INLINE PyObject *__Pyx__GetModuleGlobalName(PyObject *name) +#endif +{ PyObject *result; #if !CYTHON_AVOID_BORROWED_REFS #if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX >= 0x030500A1 result = _PyDict_GetItem_KnownHash(__pyx_d, name, ((PyASCIIObject *) name)->hash); + __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) if (likely(result)) { - Py_INCREF(result); + return __Pyx_NewRef(result); } else if (unlikely(PyErr_Occurred())) { - result = NULL; - } else { + return NULL; + } #else result = PyDict_GetItem(__pyx_d, name); + __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) if (likely(result)) { - Py_INCREF(result); - } else { + return __Pyx_NewRef(result); + } #endif #else result = PyObject_GetItem(__pyx_d, name); - if (!result) { - PyErr_Clear(); -#endif - result = __Pyx_GetBuiltinName(name); + __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) + if (likely(result)) { + return __Pyx_NewRef(result); } - return result; + PyErr_Clear(); +#endif + return __Pyx_GetBuiltinName(name); } /* PyCFunctionFastCall */ - #if CYTHON_FAST_PYCCALL +#if CYTHON_FAST_PYCCALL static CYTHON_INLINE PyObject * __Pyx_PyCFunction_FastCall(PyObject *func_obj, PyObject **args, Py_ssize_t nargs) { PyCFunctionObject *func = (PyCFunctionObject*)func_obj; PyCFunction meth = PyCFunction_GET_FUNCTION(func); PyObject *self = PyCFunction_GET_SELF(func); int flags = PyCFunction_GET_FLAGS(func); assert(PyCFunction_Check(func)); - 
assert(METH_FASTCALL == (flags & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS))); + assert(METH_FASTCALL == (flags & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS | METH_STACKLESS))); assert(nargs >= 0); assert(nargs == 0 || args != NULL); /* _PyCFunction_FastCallDict() must not be called with an exception set, @@ -11629,16 +11649,15 @@ static CYTHON_INLINE PyObject * __Pyx_PyCFunction_FastCall(PyObject *func_obj, P caller loses its exception */ assert(!PyErr_Occurred()); if ((PY_VERSION_HEX < 0x030700A0) || unlikely(flags & METH_KEYWORDS)) { - return (*((__Pyx_PyCFunctionFastWithKeywords)meth)) (self, args, nargs, NULL); + return (*((__Pyx_PyCFunctionFastWithKeywords)(void*)meth)) (self, args, nargs, NULL); } else { - return (*((__Pyx_PyCFunctionFast)meth)) (self, args, nargs); + return (*((__Pyx_PyCFunctionFast)(void*)meth)) (self, args, nargs); } } #endif /* PyFunctionFastCall */ - #if CYTHON_FAST_PYCALL -#include "frameobject.h" +#if CYTHON_FAST_PYCALL static PyObject* __Pyx_PyFunction_FastCallNoKw(PyCodeObject *co, PyObject **args, Py_ssize_t na, PyObject *globals) { PyFrameObject *f; @@ -11656,7 +11675,7 @@ static PyObject* __Pyx_PyFunction_FastCallNoKw(PyCodeObject *co, PyObject **args if (f == NULL) { return NULL; } - fastlocals = f->f_localsplus; + fastlocals = __Pyx_PyFrame_GetLocalsplus(f); for (i = 0; i < na; i++) { Py_INCREF(*args); fastlocals[i] = *args++; @@ -11757,7 +11776,7 @@ static PyObject *__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, #endif /* PyObjectCall */ - #if CYTHON_COMPILING_IN_CPYTHON +#if CYTHON_COMPILING_IN_CPYTHON static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg, PyObject *kw) { PyObject *result; ternaryfunc call = func->ob_type->tp_call; @@ -11776,8 +11795,37 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_Call(PyObject *func, PyObject *arg } #endif +/* PyObjectCall2Args */ +static CYTHON_UNUSED PyObject* __Pyx_PyObject_Call2Args(PyObject* function, 
PyObject* arg1, PyObject* arg2) { + PyObject *args, *result = NULL; + #if CYTHON_FAST_PYCALL + if (PyFunction_Check(function)) { + PyObject *args[2] = {arg1, arg2}; + return __Pyx_PyFunction_FastCall(function, args, 2); + } + #endif + #if CYTHON_FAST_PYCCALL + if (__Pyx_PyFastCFunction_Check(function)) { + PyObject *args[2] = {arg1, arg2}; + return __Pyx_PyCFunction_FastCall(function, args, 2); + } + #endif + args = PyTuple_New(2); + if (unlikely(!args)) goto done; + Py_INCREF(arg1); + PyTuple_SET_ITEM(args, 0, arg1); + Py_INCREF(arg2); + PyTuple_SET_ITEM(args, 1, arg2); + Py_INCREF(function); + result = __Pyx_PyObject_Call(function, args, NULL); + Py_DECREF(args); + Py_DECREF(function); +done: + return result; +} + /* PyObjectCallMethO */ - #if CYTHON_COMPILING_IN_CPYTHON +#if CYTHON_COMPILING_IN_CPYTHON static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject *arg) { PyObject *self, *result; PyCFunction cfunc; @@ -11797,7 +11845,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallMethO(PyObject *func, PyObject #endif /* PyObjectCallOneArg */ - #if CYTHON_COMPILING_IN_CPYTHON +#if CYTHON_COMPILING_IN_CPYTHON static PyObject* __Pyx__PyObject_CallOneArg(PyObject *func, PyObject *arg) { PyObject *result; PyObject *args = PyTuple_New(1); @@ -11837,20 +11885,20 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObjec #endif /* RaiseTooManyValuesToUnpack */ - static CYTHON_INLINE void __Pyx_RaiseTooManyValuesError(Py_ssize_t expected) { +static CYTHON_INLINE void __Pyx_RaiseTooManyValuesError(Py_ssize_t expected) { PyErr_Format(PyExc_ValueError, "too many values to unpack (expected %" CYTHON_FORMAT_SSIZE_T "d)", expected); } /* RaiseNeedMoreValuesToUnpack */ - static CYTHON_INLINE void __Pyx_RaiseNeedMoreValuesError(Py_ssize_t index) { +static CYTHON_INLINE void __Pyx_RaiseNeedMoreValuesError(Py_ssize_t index) { PyErr_Format(PyExc_ValueError, "need more than %" CYTHON_FORMAT_SSIZE_T "d value%.1s to unpack", index, 
(index == 1) ? "" : "s"); } /* IterFinish */ - static CYTHON_INLINE int __Pyx_IterFinish(void) { +static CYTHON_INLINE int __Pyx_IterFinish(void) { #if CYTHON_FAST_THREAD_STATE PyThreadState *tstate = __Pyx_PyThreadState_Current; PyObject* exc_type = tstate->curexc_type; @@ -11885,7 +11933,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObjec } /* UnpackItemEndCheck */ - static int __Pyx_IternextUnpackEndCheck(PyObject *retval, Py_ssize_t expected) { +static int __Pyx_IternextUnpackEndCheck(PyObject *retval, Py_ssize_t expected) { if (unlikely(retval)) { Py_DECREF(retval); __Pyx_RaiseTooManyValuesError(expected); @@ -11897,7 +11945,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObjec } /* ExtTypeTest */ - static CYTHON_INLINE int __Pyx_TypeTest(PyObject *obj, PyTypeObject *type) { +static CYTHON_INLINE int __Pyx_TypeTest(PyObject *obj, PyTypeObject *type) { if (unlikely(!type)) { PyErr_SetString(PyExc_SystemError, "Missing type object"); return 0; @@ -11910,7 +11958,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallOneArg(PyObject *func, PyObjec } /* GetItemInt */ - static PyObject *__Pyx_GetItemInt_Generic(PyObject *o, PyObject* j) { +static PyObject *__Pyx_GetItemInt_Generic(PyObject *o, PyObject* j) { PyObject *r; if (!j) return NULL; r = PyObject_GetItem(o, j); @@ -11925,7 +11973,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_List_Fast(PyObject *o, Py_ssize_ if (wraparound & unlikely(i < 0)) { wrapped_i += PyList_GET_SIZE(o); } - if ((!boundscheck) || likely((0 <= wrapped_i) & (wrapped_i < PyList_GET_SIZE(o)))) { + if ((!boundscheck) || likely(__Pyx_is_valid_index(wrapped_i, PyList_GET_SIZE(o)))) { PyObject *r = PyList_GET_ITEM(o, wrapped_i); Py_INCREF(r); return r; @@ -11943,7 +11991,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Tuple_Fast(PyObject *o, Py_ssize if (wraparound & unlikely(i < 0)) { wrapped_i += PyTuple_GET_SIZE(o); } - if ((!boundscheck) || likely((0 <= wrapped_i) 
& (wrapped_i < PyTuple_GET_SIZE(o)))) { + if ((!boundscheck) || likely(__Pyx_is_valid_index(wrapped_i, PyTuple_GET_SIZE(o)))) { PyObject *r = PyTuple_GET_ITEM(o, wrapped_i); Py_INCREF(r); return r; @@ -11959,7 +12007,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Fast(PyObject *o, Py_ssize_t i, #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS && CYTHON_USE_TYPE_SLOTS if (is_list || PyList_CheckExact(o)) { Py_ssize_t n = ((!wraparound) | likely(i >= 0)) ? i : i + PyList_GET_SIZE(o); - if ((!boundscheck) || (likely((n >= 0) & (n < PyList_GET_SIZE(o))))) { + if ((!boundscheck) || (likely(__Pyx_is_valid_index(n, PyList_GET_SIZE(o))))) { PyObject *r = PyList_GET_ITEM(o, n); Py_INCREF(r); return r; @@ -11967,7 +12015,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Fast(PyObject *o, Py_ssize_t i, } else if (PyTuple_CheckExact(o)) { Py_ssize_t n = ((!wraparound) | likely(i >= 0)) ? i : i + PyTuple_GET_SIZE(o); - if ((!boundscheck) || likely((n >= 0) & (n < PyTuple_GET_SIZE(o)))) { + if ((!boundscheck) || likely(__Pyx_is_valid_index(n, PyTuple_GET_SIZE(o)))) { PyObject *r = PyTuple_GET_ITEM(o, n); Py_INCREF(r); return r; @@ -11997,7 +12045,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Fast(PyObject *o, Py_ssize_t i, } /* PyErrFetchRestore */ - #if CYTHON_FAST_THREAD_STATE +#if CYTHON_FAST_THREAD_STATE static CYTHON_INLINE void __Pyx_ErrRestoreInState(PyThreadState *tstate, PyObject *type, PyObject *value, PyObject *tb) { PyObject *tmp_type, *tmp_value, *tmp_tb; tmp_type = tstate->curexc_type; @@ -12021,7 +12069,7 @@ static CYTHON_INLINE void __Pyx_ErrFetchInState(PyThreadState *tstate, PyObject #endif /* RaiseException */ - #if PY_MAJOR_VERSION < 3 +#if PY_MAJOR_VERSION < 3 static void __Pyx_Raise(PyObject *type, PyObject *value, PyObject *tb, CYTHON_UNUSED PyObject *cause) { __Pyx_PyThreadState_declare @@ -12180,7 +12228,7 @@ static void __Pyx_Raise(PyObject *type, PyObject *value, PyObject *tb, PyObject #endif /* WriteUnraisableException */ - 
static void __Pyx_WriteUnraisable(const char *name, CYTHON_UNUSED int clineno, +static void __Pyx_WriteUnraisable(const char *name, CYTHON_UNUSED int clineno, CYTHON_UNUSED int lineno, CYTHON_UNUSED const char *filename, int full_traceback, CYTHON_UNUSED int nogil) { PyObject *old_exc, *old_val, *old_tb; @@ -12222,7 +12270,7 @@ static void __Pyx_Raise(PyObject *type, PyObject *value, PyObject *tb, PyObject } /* PyObjectSetAttrStr */ - #if CYTHON_USE_TYPE_SLOTS +#if CYTHON_USE_TYPE_SLOTS static CYTHON_INLINE int __Pyx_PyObject_SetAttrStr(PyObject* obj, PyObject* attr_name, PyObject* value) { PyTypeObject* tp = Py_TYPE(obj); if (likely(tp->tp_setattro)) @@ -12236,16 +12284,21 @@ static CYTHON_INLINE int __Pyx_PyObject_SetAttrStr(PyObject* obj, PyObject* attr #endif /* DictGetItem */ - #if PY_MAJOR_VERSION >= 3 && !CYTHON_COMPILING_IN_PYPY +#if PY_MAJOR_VERSION >= 3 && !CYTHON_COMPILING_IN_PYPY static PyObject *__Pyx_PyDict_GetItem(PyObject *d, PyObject* key) { PyObject *value; value = PyDict_GetItemWithError(d, key); if (unlikely(!value)) { if (!PyErr_Occurred()) { - PyObject* args = PyTuple_Pack(1, key); - if (likely(args)) - PyErr_SetObject(PyExc_KeyError, args); - Py_XDECREF(args); + if (unlikely(PyTuple_Check(key))) { + PyObject* args = PyTuple_Pack(1, key); + if (likely(args)) { + PyErr_SetObject(PyExc_KeyError, args); + Py_DECREF(args); + } + } else { + PyErr_SetObject(PyExc_KeyError, key); + } } return NULL; } @@ -12255,17 +12308,33 @@ static PyObject *__Pyx_PyDict_GetItem(PyObject *d, PyObject* key) { #endif /* RaiseNoneIterError */ - static CYTHON_INLINE void __Pyx_RaiseNoneNotIterableError(void) { +static CYTHON_INLINE void __Pyx_RaiseNoneNotIterableError(void) { PyErr_SetString(PyExc_TypeError, "'NoneType' object is not iterable"); } +/* GetTopmostException */ +#if CYTHON_USE_EXC_INFO_STACK +static _PyErr_StackItem * +__Pyx_PyErr_GetTopmostException(PyThreadState *tstate) +{ + _PyErr_StackItem *exc_info = tstate->exc_info; + while ((exc_info->exc_type == 
NULL || exc_info->exc_type == Py_None) && + exc_info->previous_item != NULL) + { + exc_info = exc_info->previous_item; + } + return exc_info; +} +#endif + /* SaveResetException */ - #if CYTHON_FAST_THREAD_STATE +#if CYTHON_FAST_THREAD_STATE static CYTHON_INLINE void __Pyx__ExceptionSave(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) { - #if PY_VERSION_HEX >= 0x030700A3 - *type = tstate->exc_state.exc_type; - *value = tstate->exc_state.exc_value; - *tb = tstate->exc_state.exc_traceback; + #if CYTHON_USE_EXC_INFO_STACK + _PyErr_StackItem *exc_info = __Pyx_PyErr_GetTopmostException(tstate); + *type = exc_info->exc_type; + *value = exc_info->exc_value; + *tb = exc_info->exc_traceback; #else *type = tstate->exc_type; *value = tstate->exc_value; @@ -12277,13 +12346,14 @@ static CYTHON_INLINE void __Pyx__ExceptionSave(PyThreadState *tstate, PyObject * } static CYTHON_INLINE void __Pyx__ExceptionReset(PyThreadState *tstate, PyObject *type, PyObject *value, PyObject *tb) { PyObject *tmp_type, *tmp_value, *tmp_tb; - #if PY_VERSION_HEX >= 0x030700A3 - tmp_type = tstate->exc_state.exc_type; - tmp_value = tstate->exc_state.exc_value; - tmp_tb = tstate->exc_state.exc_traceback; - tstate->exc_state.exc_type = type; - tstate->exc_state.exc_value = value; - tstate->exc_state.exc_traceback = tb; + #if CYTHON_USE_EXC_INFO_STACK + _PyErr_StackItem *exc_info = tstate->exc_info; + tmp_type = exc_info->exc_type; + tmp_value = exc_info->exc_value; + tmp_tb = exc_info->exc_traceback; + exc_info->exc_type = type; + exc_info->exc_value = value; + exc_info->exc_traceback = tb; #else tmp_type = tstate->exc_type; tmp_value = tstate->exc_value; @@ -12299,7 +12369,7 @@ static CYTHON_INLINE void __Pyx__ExceptionReset(PyThreadState *tstate, PyObject #endif /* PyErrExceptionMatches */ - #if CYTHON_FAST_THREAD_STATE +#if CYTHON_FAST_THREAD_STATE static int __Pyx_PyErr_ExceptionMatchesTuple(PyObject *exc_type, PyObject *tuple) { Py_ssize_t i, n; n = PyTuple_GET_SIZE(tuple); 
@@ -12324,11 +12394,12 @@ static CYTHON_INLINE int __Pyx_PyErr_ExceptionMatchesInState(PyThreadState* tsta #endif /* GetException */ - #if CYTHON_FAST_THREAD_STATE -static int __Pyx__GetException(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) { +#if CYTHON_FAST_THREAD_STATE +static int __Pyx__GetException(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) #else -static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) { +static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) #endif +{ PyObject *local_type, *local_value, *local_tb; #if CYTHON_FAST_THREAD_STATE PyObject *tmp_type, *tmp_value, *tmp_tb; @@ -12361,13 +12432,16 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) *value = local_value; *tb = local_tb; #if CYTHON_FAST_THREAD_STATE - #if PY_VERSION_HEX >= 0x030700A3 - tmp_type = tstate->exc_state.exc_type; - tmp_value = tstate->exc_state.exc_value; - tmp_tb = tstate->exc_state.exc_traceback; - tstate->exc_state.exc_type = local_type; - tstate->exc_state.exc_value = local_value; - tstate->exc_state.exc_traceback = local_tb; + #if CYTHON_USE_EXC_INFO_STACK + { + _PyErr_StackItem *exc_info = tstate->exc_info; + tmp_type = exc_info->exc_type; + tmp_value = exc_info->exc_value; + tmp_tb = exc_info->exc_traceback; + exc_info->exc_type = local_type; + exc_info->exc_value = local_value; + exc_info->exc_traceback = local_tb; + } #else tmp_type = tstate->exc_type; tmp_value = tstate->exc_value; @@ -12394,7 +12468,7 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) } /* PyObject_GenericGetAttrNoDict */ - #if CYTHON_USE_TYPE_SLOTS && CYTHON_USE_PYTYPE_LOOKUP && PY_VERSION_HEX < 0x03070000 +#if CYTHON_USE_TYPE_SLOTS && CYTHON_USE_PYTYPE_LOOKUP && PY_VERSION_HEX < 0x03070000 static PyObject *__Pyx_RaiseGenericGetAttributeError(PyTypeObject *tp, PyObject *attr_name) { PyErr_Format(PyExc_AttributeError, #if 
PY_MAJOR_VERSION >= 3 @@ -12434,7 +12508,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_GenericGetAttrNoDict(PyObject* obj #endif /* SetVTable */ - static int __Pyx_SetVtable(PyObject *dict, void *vtable) { +static int __Pyx_SetVtable(PyObject *dict, void *vtable) { #if PY_VERSION_HEX >= 0x02070000 PyObject *ob = PyCapsule_New(vtable, 0, 0); #else @@ -12452,7 +12526,7 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_GenericGetAttrNoDict(PyObject* obj } /* SetupReduce */ - static int __Pyx_setup_reduce_is_named(PyObject* meth, PyObject* name) { +static int __Pyx_setup_reduce_is_named(PyObject* meth, PyObject* name) { int ret; PyObject *name_attr; name_attr = __Pyx_PyObject_GetAttrStr(meth, __pyx_n_s_name); @@ -12527,8 +12601,69 @@ static int __Pyx_setup_reduce(PyObject* type_obj) { return ret; } +/* TypeImport */ +#ifndef __PYX_HAVE_RT_ImportType +#define __PYX_HAVE_RT_ImportType +static PyTypeObject *__Pyx_ImportType(PyObject *module, const char *module_name, const char *class_name, + size_t size, enum __Pyx_ImportType_CheckSize check_size) +{ + PyObject *result = 0; + char warning[200]; + Py_ssize_t basicsize; +#ifdef Py_LIMITED_API + PyObject *py_basicsize; +#endif + result = PyObject_GetAttrString(module, class_name); + if (!result) + goto bad; + if (!PyType_Check(result)) { + PyErr_Format(PyExc_TypeError, + "%.200s.%.200s is not a type object", + module_name, class_name); + goto bad; + } +#ifndef Py_LIMITED_API + basicsize = ((PyTypeObject *)result)->tp_basicsize; +#else + py_basicsize = PyObject_GetAttrString(result, "__basicsize__"); + if (!py_basicsize) + goto bad; + basicsize = PyLong_AsSsize_t(py_basicsize); + Py_DECREF(py_basicsize); + py_basicsize = 0; + if (basicsize == (Py_ssize_t)-1 && PyErr_Occurred()) + goto bad; +#endif + if ((size_t)basicsize < size) { + PyErr_Format(PyExc_ValueError, + "%.200s.%.200s size changed, may indicate binary incompatibility. 
" + "Expected %zd from C header, got %zd from PyObject", + module_name, class_name, size, basicsize); + goto bad; + } + if (check_size == __Pyx_ImportType_CheckSize_Error && (size_t)basicsize != size) { + PyErr_Format(PyExc_ValueError, + "%.200s.%.200s size changed, may indicate binary incompatibility. " + "Expected %zd from C header, got %zd from PyObject", + module_name, class_name, size, basicsize); + goto bad; + } + else if (check_size == __Pyx_ImportType_CheckSize_Warn && (size_t)basicsize > size) { + PyOS_snprintf(warning, sizeof(warning), + "%s.%s size changed, may indicate binary incompatibility. " + "Expected %zd from C header, got %zd from PyObject", + module_name, class_name, size, basicsize); + if (PyErr_WarnEx(NULL, warning, 0) < 0) goto bad; + } + return (PyTypeObject *)result; +bad: + Py_XDECREF(result); + return NULL; +} +#endif + /* Import */ - static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level) { +static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level) { PyObject *empty_list = 0; PyObject *module = 0; PyObject *global_dict = 0; @@ -12575,7 +12710,7 @@ static int __Pyx_setup_reduce(PyObject* type_obj) { if (!py_level) goto bad; module = PyObject_CallFunctionObjArgs(py_import, - name, global_dict, empty_dict, list, py_level, NULL); + name, global_dict, empty_dict, list, py_level, (PyObject *)NULL); Py_DECREF(py_level); #else module = PyImport_ImportModuleLevelObject( @@ -12593,7 +12728,7 @@ static int __Pyx_setup_reduce(PyObject* type_obj) { } /* ImportFrom */ - static PyObject* __Pyx_ImportFrom(PyObject* module, PyObject* name) { +static PyObject* __Pyx_ImportFrom(PyObject* module, PyObject* name) { PyObject* value = __Pyx_PyObject_GetAttrStr(module, name); if (unlikely(!value) && PyErr_ExceptionMatches(PyExc_AttributeError)) { PyErr_Format(PyExc_ImportError, @@ -12607,8 +12742,8 @@ static int __Pyx_setup_reduce(PyObject* type_obj) { } /* CLineInTraceback */ - #ifndef CYTHON_CLINE_IN_TRACEBACK -static 
int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_line) { +#ifndef CYTHON_CLINE_IN_TRACEBACK +static int __Pyx_CLineForTraceback(PyThreadState *tstate, int c_line) { PyObject *use_cline; PyObject *ptype, *pvalue, *ptraceback; #if CYTHON_COMPILING_IN_CPYTHON @@ -12621,7 +12756,9 @@ static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_li #if CYTHON_COMPILING_IN_CPYTHON cython_runtime_dict = _PyObject_GetDictPtr(__pyx_cython_runtime); if (likely(cython_runtime_dict)) { - use_cline = __Pyx_PyDict_GetItemStr(*cython_runtime_dict, __pyx_n_s_cline_in_traceback); + __PYX_PY_DICT_LOOKUP_IF_MODIFIED( + use_cline, *cython_runtime_dict, + __Pyx_PyDict_GetItemStr(*cython_runtime_dict, __pyx_n_s_cline_in_traceback)) } else #endif { @@ -12638,7 +12775,7 @@ static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_li c_line = 0; PyObject_SetAttr(__pyx_cython_runtime, __pyx_n_s_cline_in_traceback, Py_False); } - else if (PyObject_Not(use_cline) != 0) { + else if (use_cline == Py_False || (use_cline != Py_True && PyObject_Not(use_cline) != 0)) { c_line = 0; } __Pyx_ErrRestoreInState(tstate, ptype, pvalue, ptraceback); @@ -12647,7 +12784,7 @@ static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_li #endif /* CodeObjectCache */ - static int __pyx_bisect_code_objects(__Pyx_CodeObjectCacheEntry* entries, int count, int code_line) { +static int __pyx_bisect_code_objects(__Pyx_CodeObjectCacheEntry* entries, int count, int code_line) { int start = 0, mid = 0, end = count - 1; if (end >= 0 && code_line > entries[end].code_line) { return count; @@ -12727,7 +12864,7 @@ static void __pyx_insert_code_object(int code_line, PyCodeObject* code_object) { } /* AddTraceback */ - #include "compile.h" +#include "compile.h" #include "frameobject.h" #include "traceback.h" static PyCodeObject* __Pyx_CreateCodeObjectForTraceback( @@ -12812,7 +12949,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, 
} /* CIntFromPyVerify */ - #define __PYX_VERIFY_RETURN_INT(target_type, func_type, func_value)\ +#define __PYX_VERIFY_RETURN_INT(target_type, func_type, func_value)\ __PYX__VERIFY_RETURN_INT(target_type, func_type, func_value, 0) #define __PYX_VERIFY_RETURN_INT_EXC(target_type, func_type, func_value)\ __PYX__VERIFY_RETURN_INT(target_type, func_type, func_value, 1) @@ -12834,8 +12971,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_npy_uint32(npy_uint32 value) { - const npy_uint32 neg_one = (npy_uint32) -1, const_zero = (npy_uint32) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_npy_uint32(npy_uint32 value) { + const npy_uint32 neg_one = (npy_uint32) ((npy_uint32) 0 - (npy_uint32) 1), const_zero = (npy_uint32) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(npy_uint32) < sizeof(long)) { @@ -12865,7 +13002,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* None */ - static CYTHON_INLINE int __Pyx_ErrOccurredWithGIL(void) { +static CYTHON_INLINE int __Pyx_ErrOccurredWithGIL(void) { int err; #ifdef WITH_THREAD PyGILState_STATE _save = PyGILState_Ensure(); @@ -12878,8 +13015,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_int(int value) { - const int neg_one = (int) -1, const_zero = (int) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_int(int value) { + const int neg_one = (int) ((int) 0 - (int) 1), const_zero = (int) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(int) < sizeof(long)) { @@ -12909,8 +13046,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_PY_LONG_LONG(PY_LONG_LONG value) { - const PY_LONG_LONG neg_one = (PY_LONG_LONG) -1, const_zero = (PY_LONG_LONG) 0; +static CYTHON_INLINE PyObject* 
__Pyx_PyInt_From_PY_LONG_LONG(PY_LONG_LONG value) { + const PY_LONG_LONG neg_one = (PY_LONG_LONG) ((PY_LONG_LONG) 0 - (PY_LONG_LONG) 1), const_zero = (PY_LONG_LONG) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(PY_LONG_LONG) < sizeof(long)) { @@ -12940,7 +13077,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* Declarations */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #ifdef __cplusplus static CYTHON_INLINE __pyx_t_float_complex __pyx_t_float_complex_from_parts(float x, float y) { return ::std::complex< float >(x, y); @@ -12960,7 +13097,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* Arithmetic */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #else static CYTHON_INLINE int __Pyx_c_eq_float(__pyx_t_float_complex a, __pyx_t_float_complex b) { return (a.real == b.real) && (a.imag == b.imag); @@ -13095,7 +13232,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* Declarations */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #ifdef __cplusplus static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(double x, double y) { return ::std::complex< double >(x, y); @@ -13115,7 +13252,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* Arithmetic */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #else static CYTHON_INLINE int __Pyx_c_eq_double(__pyx_t_double_complex a, __pyx_t_double_complex b) { return (a.real == b.real) && (a.imag == b.imag); @@ -13250,8 +13387,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES value) { - const enum NPY_TYPES neg_one = (enum NPY_TYPES) -1, const_zero = (enum NPY_TYPES) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES value) { + const enum NPY_TYPES neg_one = (enum NPY_TYPES) ((enum NPY_TYPES) 0 - (enum NPY_TYPES) 1), const_zero = (enum 
NPY_TYPES) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(enum NPY_TYPES) < sizeof(long)) { @@ -13281,8 +13418,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE npy_uint32 __Pyx_PyInt_As_npy_uint32(PyObject *x) { - const npy_uint32 neg_one = (npy_uint32) -1, const_zero = (npy_uint32) 0; +static CYTHON_INLINE npy_uint32 __Pyx_PyInt_As_npy_uint32(PyObject *x) { + const npy_uint32 neg_one = (npy_uint32) ((npy_uint32) 0 - (npy_uint32) 1), const_zero = (npy_uint32) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -13470,8 +13607,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE PY_LONG_LONG __Pyx_PyInt_As_PY_LONG_LONG(PyObject *x) { - const PY_LONG_LONG neg_one = (PY_LONG_LONG) -1, const_zero = (PY_LONG_LONG) 0; +static CYTHON_INLINE PY_LONG_LONG __Pyx_PyInt_As_PY_LONG_LONG(PyObject *x) { + const PY_LONG_LONG neg_one = (PY_LONG_LONG) ((PY_LONG_LONG) 0 - (PY_LONG_LONG) 1), const_zero = (PY_LONG_LONG) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -13659,8 +13796,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE size_t __Pyx_PyInt_As_size_t(PyObject *x) { - const size_t neg_one = (size_t) -1, const_zero = (size_t) 0; +static CYTHON_INLINE size_t __Pyx_PyInt_As_size_t(PyObject *x) { + const size_t neg_one = (size_t) ((size_t) 0 - (size_t) 1), const_zero = (size_t) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -13848,8 +13985,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE int __Pyx_PyInt_As_int(PyObject *x) { - const int neg_one = (int) -1, const_zero = (int) 0; +static CYTHON_INLINE int __Pyx_PyInt_As_int(PyObject *x) { 
+ const int neg_one = (int) ((int) 0 - (int) 1), const_zero = (int) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -14037,8 +14174,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { - const long neg_one = (long) -1, const_zero = (long) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { + const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(long) < sizeof(long)) { @@ -14068,8 +14205,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE long __Pyx_PyInt_As_long(PyObject *x) { - const long neg_one = (long) -1, const_zero = (long) 0; +static CYTHON_INLINE long __Pyx_PyInt_As_long(PyObject *x) { + const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -14257,7 +14394,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* FastTypeChecks */ - #if CYTHON_COMPILING_IN_CPYTHON +#if CYTHON_COMPILING_IN_CPYTHON static int __Pyx_InBases(PyTypeObject *a, PyTypeObject *b) { while (a) { a = a->tp_base; @@ -14357,7 +14494,7 @@ static CYTHON_INLINE int __Pyx_PyErr_GivenExceptionMatches2(PyObject *err, PyObj #endif /* FetchCommonType */ - static PyTypeObject* __Pyx_FetchCommonType(PyTypeObject* type) { +static PyTypeObject* __Pyx_FetchCommonType(PyTypeObject* type) { PyObject* fake_module; PyTypeObject* cached_type = NULL; fake_module = PyImport_AddModule((char*) "_cython_" CYTHON_ABI); @@ -14396,16 +14533,17 @@ static CYTHON_INLINE int __Pyx_PyErr_GivenExceptionMatches2(PyObject *err, PyObj } /* SwapException */ - #if CYTHON_FAST_THREAD_STATE +#if CYTHON_FAST_THREAD_STATE static CYTHON_INLINE void 
__Pyx__ExceptionSwap(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) { PyObject *tmp_type, *tmp_value, *tmp_tb; - #if PY_VERSION_HEX >= 0x030700A3 - tmp_type = tstate->exc_state.exc_type; - tmp_value = tstate->exc_state.exc_value; - tmp_tb = tstate->exc_state.exc_traceback; - tstate->exc_state.exc_type = *type; - tstate->exc_state.exc_value = *value; - tstate->exc_state.exc_traceback = *tb; + #if CYTHON_USE_EXC_INFO_STACK + _PyErr_StackItem *exc_info = tstate->exc_info; + tmp_type = exc_info->exc_type; + tmp_value = exc_info->exc_value; + tmp_tb = exc_info->exc_traceback; + exc_info->exc_type = *type; + exc_info->exc_value = *value; + exc_info->exc_traceback = *tb; #else tmp_type = tstate->exc_type; tmp_value = tstate->exc_value; @@ -14429,59 +14567,122 @@ static CYTHON_INLINE void __Pyx_ExceptionSwap(PyObject **type, PyObject **value, } #endif -/* PyObjectCallMethod1 */ - static PyObject* __Pyx__PyObject_CallMethod1(PyObject* method, PyObject* arg) { - PyObject *result = NULL; -#if CYTHON_UNPACK_METHODS - if (likely(PyMethod_Check(method))) { - PyObject *self = PyMethod_GET_SELF(method); - if (likely(self)) { - PyObject *args; - PyObject *function = PyMethod_GET_FUNCTION(method); - #if CYTHON_FAST_PYCALL - if (PyFunction_Check(function)) { - PyObject *args[2] = {self, arg}; - result = __Pyx_PyFunction_FastCall(function, args, 2); - goto done; - } - #endif - #if CYTHON_FAST_PYCCALL - if (__Pyx_PyFastCFunction_Check(function)) { - PyObject *args[2] = {self, arg}; - result = __Pyx_PyCFunction_FastCall(function, args, 2); - goto done; +/* PyObjectGetMethod */ +static int __Pyx_PyObject_GetMethod(PyObject *obj, PyObject *name, PyObject **method) { + PyObject *attr; +#if CYTHON_UNPACK_METHODS && CYTHON_COMPILING_IN_CPYTHON && CYTHON_USE_PYTYPE_LOOKUP + PyTypeObject *tp = Py_TYPE(obj); + PyObject *descr; + descrgetfunc f = NULL; + PyObject **dictptr, *dict; + int meth_found = 0; + assert (*method == NULL); + if (unlikely(tp->tp_getattro != 
PyObject_GenericGetAttr)) { + attr = __Pyx_PyObject_GetAttrStr(obj, name); + goto try_unpack; + } + if (unlikely(tp->tp_dict == NULL) && unlikely(PyType_Ready(tp) < 0)) { + return 0; + } + descr = _PyType_Lookup(tp, name); + if (likely(descr != NULL)) { + Py_INCREF(descr); +#if PY_MAJOR_VERSION >= 3 + #ifdef __Pyx_CyFunction_USED + if (likely(PyFunction_Check(descr) || (Py_TYPE(descr) == &PyMethodDescr_Type) || __Pyx_CyFunction_Check(descr))) + #else + if (likely(PyFunction_Check(descr) || (Py_TYPE(descr) == &PyMethodDescr_Type))) + #endif +#else + #ifdef __Pyx_CyFunction_USED + if (likely(PyFunction_Check(descr) || __Pyx_CyFunction_Check(descr))) + #else + if (likely(PyFunction_Check(descr))) + #endif +#endif + { + meth_found = 1; + } else { + f = Py_TYPE(descr)->tp_descr_get; + if (f != NULL && PyDescr_IsData(descr)) { + attr = f(descr, obj, (PyObject *)Py_TYPE(obj)); + Py_DECREF(descr); + goto try_unpack; } - #endif - args = PyTuple_New(2); - if (unlikely(!args)) goto done; - Py_INCREF(self); - PyTuple_SET_ITEM(args, 0, self); - Py_INCREF(arg); - PyTuple_SET_ITEM(args, 1, arg); - Py_INCREF(function); - result = __Pyx_PyObject_Call(function, args, NULL); - Py_DECREF(args); - Py_DECREF(function); - return result; } } + dictptr = _PyObject_GetDictPtr(obj); + if (dictptr != NULL && (dict = *dictptr) != NULL) { + Py_INCREF(dict); + attr = __Pyx_PyDict_GetItemStr(dict, name); + if (attr != NULL) { + Py_INCREF(attr); + Py_DECREF(dict); + Py_XDECREF(descr); + goto try_unpack; + } + Py_DECREF(dict); + } + if (meth_found) { + *method = descr; + return 1; + } + if (f != NULL) { + attr = f(descr, obj, (PyObject *)Py_TYPE(obj)); + Py_DECREF(descr); + goto try_unpack; + } + if (descr != NULL) { + *method = descr; + return 0; + } + PyErr_Format(PyExc_AttributeError, +#if PY_MAJOR_VERSION >= 3 + "'%.50s' object has no attribute '%U'", + tp->tp_name, name); +#else + "'%.50s' object has no attribute '%.400s'", + tp->tp_name, PyString_AS_STRING(name)); #endif - result = 
__Pyx_PyObject_CallOneArg(method, arg); - goto done; -done: + return 0; +#else + attr = __Pyx_PyObject_GetAttrStr(obj, name); + goto try_unpack; +#endif +try_unpack: +#if CYTHON_UNPACK_METHODS + if (likely(attr) && PyMethod_Check(attr) && likely(PyMethod_GET_SELF(attr) == obj)) { + PyObject *function = PyMethod_GET_FUNCTION(attr); + Py_INCREF(function); + Py_DECREF(attr); + *method = function; + return 1; + } +#endif + *method = attr; + return 0; +} + +/* PyObjectCallMethod1 */ +static PyObject* __Pyx__PyObject_CallMethod1(PyObject* method, PyObject* arg) { + PyObject *result = __Pyx_PyObject_CallOneArg(method, arg); + Py_DECREF(method); return result; } static PyObject* __Pyx_PyObject_CallMethod1(PyObject* obj, PyObject* method_name, PyObject* arg) { - PyObject *method, *result; - method = __Pyx_PyObject_GetAttrStr(obj, method_name); + PyObject *method = NULL, *result; + int is_method = __Pyx_PyObject_GetMethod(obj, method_name, &method); + if (likely(is_method)) { + result = __Pyx_PyObject_Call2Args(method, obj, arg); + Py_DECREF(method); + return result; + } if (unlikely(!method)) return NULL; - result = __Pyx__PyObject_CallMethod1(method, arg); - Py_DECREF(method); - return result; + return __Pyx__PyObject_CallMethod1(method, arg); } /* CoroutineBase */ - #include +#include #include #define __Pyx_Coroutine_Undelegate(gen) Py_CLEAR((gen)->yieldfrom) static int __Pyx_PyGen__FetchStopIterationValue(CYTHON_UNUSED PyThreadState *__pyx_tstate, PyObject **pvalue) { @@ -14564,21 +14765,22 @@ static int __Pyx_PyGen__FetchStopIterationValue(CYTHON_UNUSED PyThreadState *__p return 0; } static CYTHON_INLINE -void __Pyx_Coroutine_ExceptionClear(__pyx_CoroutineObject *self) { - PyObject *exc_type = self->exc_type; - PyObject *exc_value = self->exc_value; - PyObject *exc_traceback = self->exc_traceback; - self->exc_type = NULL; - self->exc_value = NULL; - self->exc_traceback = NULL; - Py_XDECREF(exc_type); - Py_XDECREF(exc_value); - Py_XDECREF(exc_traceback); +void 
__Pyx_Coroutine_ExceptionClear(__Pyx_ExcInfoStruct *exc_state) { + PyObject *t, *v, *tb; + t = exc_state->exc_type; + v = exc_state->exc_value; + tb = exc_state->exc_traceback; + exc_state->exc_type = NULL; + exc_state->exc_value = NULL; + exc_state->exc_traceback = NULL; + Py_XDECREF(t); + Py_XDECREF(v); + Py_XDECREF(tb); } #define __Pyx_Coroutine_AlreadyRunningError(gen) (__Pyx__Coroutine_AlreadyRunningError(gen), (PyObject*)NULL) static void __Pyx__Coroutine_AlreadyRunningError(CYTHON_UNUSED __pyx_CoroutineObject *gen) { const char *msg; - if (0) { + if ((0)) { #ifdef __Pyx_Coroutine_USED } else if (__Pyx_Coroutine_Check((PyObject*)gen)) { msg = "coroutine already executing"; @@ -14595,7 +14797,7 @@ static void __Pyx__Coroutine_AlreadyRunningError(CYTHON_UNUSED __pyx_CoroutineOb #define __Pyx_Coroutine_NotStartedError(gen) (__Pyx__Coroutine_NotStartedError(gen), (PyObject*)NULL) static void __Pyx__Coroutine_NotStartedError(CYTHON_UNUSED PyObject *gen) { const char *msg; - if (0) { + if ((0)) { #ifdef __Pyx_Coroutine_USED } else if (__Pyx_Coroutine_Check(gen)) { msg = "can't send non-None value to a just-started coroutine"; @@ -14629,6 +14831,7 @@ static PyObject *__Pyx_Coroutine_SendEx(__pyx_CoroutineObject *self, PyObject *value, int closing) { __Pyx_PyThreadState_declare PyThreadState *tstate; + __Pyx_ExcInfoStruct *exc_state; PyObject *retval; assert(!self->is_running); if (unlikely(self->resume_label == 0)) { @@ -14645,33 +14848,47 @@ PyObject *__Pyx_Coroutine_SendEx(__pyx_CoroutineObject *self, PyObject *value, i #else tstate = __Pyx_PyThreadState_Current; #endif - if (self->exc_type) { -#if CYTHON_COMPILING_IN_PYPY || CYTHON_COMPILING_IN_PYSTON -#else - if (self->exc_traceback) { - PyTracebackObject *tb = (PyTracebackObject *) self->exc_traceback; + exc_state = &self->gi_exc_state; + if (exc_state->exc_type) { + #if CYTHON_COMPILING_IN_PYPY || CYTHON_COMPILING_IN_PYSTON + #else + if (exc_state->exc_traceback) { + PyTracebackObject *tb = (PyTracebackObject 
*) exc_state->exc_traceback; PyFrameObject *f = tb->tb_frame; Py_XINCREF(tstate->frame); assert(f->f_back == NULL); f->f_back = tstate->frame; } -#endif - __Pyx_ExceptionSwap(&self->exc_type, &self->exc_value, - &self->exc_traceback); + #endif + } +#if CYTHON_USE_EXC_INFO_STACK + exc_state->previous_item = tstate->exc_info; + tstate->exc_info = exc_state; +#else + if (exc_state->exc_type) { + __Pyx_ExceptionSwap(&exc_state->exc_type, &exc_state->exc_value, &exc_state->exc_traceback); } else { - __Pyx_Coroutine_ExceptionClear(self); - __Pyx_ExceptionSave(&self->exc_type, &self->exc_value, &self->exc_traceback); + __Pyx_Coroutine_ExceptionClear(exc_state); + __Pyx_ExceptionSave(&exc_state->exc_type, &exc_state->exc_value, &exc_state->exc_traceback); } +#endif self->is_running = 1; retval = self->body((PyObject *) self, tstate, value); self->is_running = 0; +#if CYTHON_USE_EXC_INFO_STACK + exc_state = &self->gi_exc_state; + tstate->exc_info = exc_state->previous_item; + exc_state->previous_item = NULL; + __Pyx_Coroutine_ResetFrameBackpointer(exc_state); +#endif return retval; } -static CYTHON_INLINE void __Pyx_Coroutine_ResetFrameBackpointer(__pyx_CoroutineObject *self) { - if (likely(self->exc_traceback)) { +static CYTHON_INLINE void __Pyx_Coroutine_ResetFrameBackpointer(__Pyx_ExcInfoStruct *exc_state) { + PyObject *exc_tb = exc_state->exc_traceback; + if (likely(exc_tb)) { #if CYTHON_COMPILING_IN_PYPY || CYTHON_COMPILING_IN_PYSTON #else - PyTracebackObject *tb = (PyTracebackObject *) self->exc_traceback; + PyTracebackObject *tb = (PyTracebackObject *) exc_tb; PyFrameObject *f = tb->tb_frame; Py_CLEAR(f->f_back); #endif @@ -14770,7 +14987,7 @@ static int __Pyx_Coroutine_CloseIter(__pyx_CoroutineObject *gen, PyObject *yf) { return -1; } else if (__Pyx_CoroutineAwait_CheckExact(yf)) { - retval = __Pyx_CoroutineAwait_Close((__pyx_CoroutineAwaitObject*)yf); + retval = __Pyx_CoroutineAwait_Close((__pyx_CoroutineAwaitObject*)yf, NULL); if (!retval) return -1; } else @@ 
-14835,6 +15052,9 @@ static PyObject *__Pyx_Generator_Next(PyObject *self) { } return __Pyx_Coroutine_SendEx(gen, Py_None, 0); } +static PyObject *__Pyx_Coroutine_Close_Method(PyObject *self, CYTHON_UNUSED PyObject *arg) { + return __Pyx_Coroutine_Close(self); +} static PyObject *__Pyx_Coroutine_Close(PyObject *self) { __pyx_CoroutineObject *gen = (__pyx_CoroutineObject *) self; PyObject *retval, *raised_exception; @@ -14951,23 +15171,24 @@ static PyObject *__Pyx_Coroutine_Throw(PyObject *self, PyObject *args) { return NULL; return __Pyx__Coroutine_Throw(self, typ, val, tb, args, 1); } +static CYTHON_INLINE int __Pyx_Coroutine_traverse_excstate(__Pyx_ExcInfoStruct *exc_state, visitproc visit, void *arg) { + Py_VISIT(exc_state->exc_type); + Py_VISIT(exc_state->exc_value); + Py_VISIT(exc_state->exc_traceback); + return 0; +} static int __Pyx_Coroutine_traverse(__pyx_CoroutineObject *gen, visitproc visit, void *arg) { Py_VISIT(gen->closure); Py_VISIT(gen->classobj); Py_VISIT(gen->yieldfrom); - Py_VISIT(gen->exc_type); - Py_VISIT(gen->exc_value); - Py_VISIT(gen->exc_traceback); - return 0; + return __Pyx_Coroutine_traverse_excstate(&gen->gi_exc_state, visit, arg); } static int __Pyx_Coroutine_clear(PyObject *self) { __pyx_CoroutineObject *gen = (__pyx_CoroutineObject *) self; Py_CLEAR(gen->closure); Py_CLEAR(gen->classobj); Py_CLEAR(gen->yieldfrom); - Py_CLEAR(gen->exc_type); - Py_CLEAR(gen->exc_value); - Py_CLEAR(gen->exc_traceback); + __Pyx_Coroutine_ExceptionClear(&gen->gi_exc_state); #ifdef __Pyx_AsyncGen_USED if (__Pyx_AsyncGen_CheckExact(self)) { Py_CLEAR(((__pyx_PyAsyncGenObject*)gen)->ag_finalizer); @@ -15105,7 +15326,7 @@ static void __Pyx_Coroutine_del(PyObject *self) { #endif } static PyObject * -__Pyx_Coroutine_get_name(__pyx_CoroutineObject *self) +__Pyx_Coroutine_get_name(__pyx_CoroutineObject *self, CYTHON_UNUSED void *context) { PyObject *name = self->gi_name; if (unlikely(!name)) name = Py_None; @@ -15113,14 +15334,15 @@ 
__Pyx_Coroutine_get_name(__pyx_CoroutineObject *self) return name; } static int -__Pyx_Coroutine_set_name(__pyx_CoroutineObject *self, PyObject *value) +__Pyx_Coroutine_set_name(__pyx_CoroutineObject *self, PyObject *value, CYTHON_UNUSED void *context) { PyObject *tmp; #if PY_MAJOR_VERSION >= 3 - if (unlikely(value == NULL || !PyUnicode_Check(value))) { + if (unlikely(value == NULL || !PyUnicode_Check(value))) #else - if (unlikely(value == NULL || !PyString_Check(value))) { + if (unlikely(value == NULL || !PyString_Check(value))) #endif + { PyErr_SetString(PyExc_TypeError, "__name__ must be set to a string object"); return -1; @@ -15132,7 +15354,7 @@ __Pyx_Coroutine_set_name(__pyx_CoroutineObject *self, PyObject *value) return 0; } static PyObject * -__Pyx_Coroutine_get_qualname(__pyx_CoroutineObject *self) +__Pyx_Coroutine_get_qualname(__pyx_CoroutineObject *self, CYTHON_UNUSED void *context) { PyObject *name = self->gi_qualname; if (unlikely(!name)) name = Py_None; @@ -15140,14 +15362,15 @@ __Pyx_Coroutine_get_qualname(__pyx_CoroutineObject *self) return name; } static int -__Pyx_Coroutine_set_qualname(__pyx_CoroutineObject *self, PyObject *value) +__Pyx_Coroutine_set_qualname(__pyx_CoroutineObject *self, PyObject *value, CYTHON_UNUSED void *context) { PyObject *tmp; #if PY_MAJOR_VERSION >= 3 - if (unlikely(value == NULL || !PyUnicode_Check(value))) { + if (unlikely(value == NULL || !PyUnicode_Check(value))) #else - if (unlikely(value == NULL || !PyString_Check(value))) { + if (unlikely(value == NULL || !PyString_Check(value))) #endif + { PyErr_SetString(PyExc_TypeError, "__qualname__ must be set to a string object"); return -1; @@ -15176,9 +15399,12 @@ static __pyx_CoroutineObject *__Pyx__Coroutine_NewInit( gen->resume_label = 0; gen->classobj = NULL; gen->yieldfrom = NULL; - gen->exc_type = NULL; - gen->exc_value = NULL; - gen->exc_traceback = NULL; + gen->gi_exc_state.exc_type = NULL; + gen->gi_exc_state.exc_value = NULL; + gen->gi_exc_state.exc_traceback = 
NULL; +#if CYTHON_USE_EXC_INFO_STACK + gen->gi_exc_state.previous_item = NULL; +#endif gen->gi_weakreflist = NULL; Py_XINCREF(qualname); gen->gi_qualname = qualname; @@ -15193,7 +15419,7 @@ static __pyx_CoroutineObject *__Pyx__Coroutine_NewInit( } /* PatchModuleWithCoroutine */ - static PyObject* __Pyx_Coroutine_patch_module(PyObject* module, const char* py_code) { +static PyObject* __Pyx_Coroutine_patch_module(PyObject* module, const char* py_code) { #if defined(__Pyx_Generator_USED) || defined(__Pyx_Coroutine_USED) int result; PyObject *globals, *result_obj; @@ -15233,7 +15459,7 @@ static __pyx_CoroutineObject *__Pyx__Coroutine_NewInit( } /* PatchGeneratorABC */ - #ifndef CYTHON_REGISTER_ABCS +#ifndef CYTHON_REGISTER_ABCS #define CYTHON_REGISTER_ABCS 1 #endif #if defined(__Pyx_Generator_USED) || defined(__Pyx_Coroutine_USED) @@ -15290,12 +15516,12 @@ static int __Pyx_patch_abc(void) { } /* Generator */ - static PyMethodDef __pyx_Generator_methods[] = { +static PyMethodDef __pyx_Generator_methods[] = { {"send", (PyCFunction) __Pyx_Coroutine_Send, METH_O, (char*) PyDoc_STR("send(arg) -> send 'arg' into generator,\nreturn next yielded value or raise StopIteration.")}, {"throw", (PyCFunction) __Pyx_Coroutine_Throw, METH_VARARGS, (char*) PyDoc_STR("throw(typ[,val[,tb]]) -> raise exception in generator,\nreturn next yielded value or raise StopIteration.")}, - {"close", (PyCFunction) __Pyx_Coroutine_Close, METH_NOARGS, + {"close", (PyCFunction) __Pyx_Coroutine_Close_Method, METH_NOARGS, (char*) PyDoc_STR("close() -> raise GeneratorExit inside generator.")}, {0, 0, 0, 0} }; @@ -15382,7 +15608,7 @@ static int __pyx_Generator_init(void) { } /* CheckBinaryVersion */ - static int __Pyx_check_binary_version(void) { +static int __Pyx_check_binary_version(void) { char ctversion[4], rtversion[4]; PyOS_snprintf(ctversion, 4, "%d.%d", PY_MAJOR_VERSION, PY_MINOR_VERSION); PyOS_snprintf(rtversion, 4, "%s", Py_GetVersion()); @@ -15398,7 +15624,7 @@ static int 
__pyx_Generator_init(void) { } /* FunctionExport */ - static int __Pyx_ExportFunction(const char *name, void (*f)(void), const char *sig) { +static int __Pyx_ExportFunction(const char *name, void (*f)(void), const char *sig) { PyObject *d = 0; PyObject *cobj = 0; union { @@ -15434,91 +15660,8 @@ static int __pyx_Generator_init(void) { return -1; } -/* ModuleImport */ - #ifndef __PYX_HAVE_RT_ImportModule -#define __PYX_HAVE_RT_ImportModule -static PyObject *__Pyx_ImportModule(const char *name) { - PyObject *py_name = 0; - PyObject *py_module = 0; - py_name = __Pyx_PyIdentifier_FromString(name); - if (!py_name) - goto bad; - py_module = PyImport_Import(py_name); - Py_DECREF(py_name); - return py_module; -bad: - Py_XDECREF(py_name); - return 0; -} -#endif - -/* TypeImport */ - #ifndef __PYX_HAVE_RT_ImportType -#define __PYX_HAVE_RT_ImportType -static PyTypeObject *__Pyx_ImportType(const char *module_name, const char *class_name, - size_t size, int strict) -{ - PyObject *py_module = 0; - PyObject *result = 0; - PyObject *py_name = 0; - char warning[200]; - Py_ssize_t basicsize; -#ifdef Py_LIMITED_API - PyObject *py_basicsize; -#endif - py_module = __Pyx_ImportModule(module_name); - if (!py_module) - goto bad; - py_name = __Pyx_PyIdentifier_FromString(class_name); - if (!py_name) - goto bad; - result = PyObject_GetAttr(py_module, py_name); - Py_DECREF(py_name); - py_name = 0; - Py_DECREF(py_module); - py_module = 0; - if (!result) - goto bad; - if (!PyType_Check(result)) { - PyErr_Format(PyExc_TypeError, - "%.200s.%.200s is not a type object", - module_name, class_name); - goto bad; - } -#ifndef Py_LIMITED_API - basicsize = ((PyTypeObject *)result)->tp_basicsize; -#else - py_basicsize = PyObject_GetAttrString(result, "__basicsize__"); - if (!py_basicsize) - goto bad; - basicsize = PyLong_AsSsize_t(py_basicsize); - Py_DECREF(py_basicsize); - py_basicsize = 0; - if (basicsize == (Py_ssize_t)-1 && PyErr_Occurred()) - goto bad; -#endif - if (!strict && (size_t)basicsize > 
size) { - PyOS_snprintf(warning, sizeof(warning), - "%s.%s size changed, may indicate binary incompatibility. Expected %zd, got %zd", - module_name, class_name, basicsize, size); - if (PyErr_WarnEx(NULL, warning, 0) < 0) goto bad; - } - else if ((size_t)basicsize != size) { - PyErr_Format(PyExc_ValueError, - "%.200s.%.200s has the wrong size, try recompiling. Expected %zd, got %zd", - module_name, class_name, basicsize, size); - goto bad; - } - return (PyTypeObject *)result; -bad: - Py_XDECREF(py_module); - Py_XDECREF(result); - return NULL; -} -#endif - /* VoidPtrImport */ - #ifndef __PYX_HAVE_RT_ImportVoidPtr +#ifndef __PYX_HAVE_RT_ImportVoidPtr #define __PYX_HAVE_RT_ImportVoidPtr static int __Pyx_ImportVoidPtr(PyObject *module, const char *name, void **p, const char *sig) { PyObject *d = 0; @@ -15567,7 +15710,7 @@ static int __Pyx_ImportVoidPtr(PyObject *module, const char *name, void **p, con #endif /* FunctionImport */ - #ifndef __PYX_HAVE_RT_ImportFunction +#ifndef __PYX_HAVE_RT_ImportFunction #define __PYX_HAVE_RT_ImportFunction static int __Pyx_ImportFunction(PyObject *module, const char *funcname, void (**f)(void), const char *sig) { PyObject *d = 0; @@ -15621,7 +15764,7 @@ static int __Pyx_ImportFunction(PyObject *module, const char *funcname, void (** #endif /* InitStrings */ - static int __Pyx_InitStrings(__Pyx_StringTabEntry *t) { +static int __Pyx_InitStrings(__Pyx_StringTabEntry *t) { while (t->p) { #if PY_MAJOR_VERSION < 3 if (t->is_unicode) { @@ -15730,6 +15873,13 @@ static CYTHON_INLINE int __Pyx_PyObject_IsTrue(PyObject* x) { if (is_true | (x == Py_False) | (x == Py_None)) return is_true; else return PyObject_IsTrue(x); } +static CYTHON_INLINE int __Pyx_PyObject_IsTrueAndDecref(PyObject* x) { + int retval; + if (unlikely(!x)) return -1; + retval = __Pyx_PyObject_IsTrue(x); + Py_DECREF(x); + return retval; +} static PyObject* __Pyx_PyNumber_IntOrLongWrongResultType(PyObject* result, const char* type_name) { #if PY_MAJOR_VERSION >= 3 if 
(PyLong_Check(result)) { @@ -15807,7 +15957,7 @@ static CYTHON_INLINE Py_ssize_t __Pyx_PyIndex_AsSsize_t(PyObject* b) { if (sizeof(Py_ssize_t) >= sizeof(long)) return PyInt_AS_LONG(b); else - return PyInt_AsSsize_t(x); + return PyInt_AsSsize_t(b); } #endif if (likely(PyLong_CheckExact(b))) { diff --git a/gensim/models/word2vec_inner.c b/gensim/models/word2vec_inner.c index c767bf61af..690e358c26 100644 --- a/gensim/models/word2vec_inner.c +++ b/gensim/models/word2vec_inner.c @@ -1,22 +1,4 @@ -/* Generated by Cython 0.28.4 */ - -/* BEGIN: Cython Metadata -{ - "distutils": { - "depends": [ - "/home/akhlif/dzr_core/gensim/gensim/models/voidptr.h" - ], - "include_dirs": [ - "/home/akhlif/dzr_core/gensim/gensim/models" - ], - "name": "gensim.models.word2vec_inner", - "sources": [ - "/home/akhlif/dzr_core/gensim/gensim/models/word2vec_inner.pyx" - ] - }, - "module_name": "gensim.models.word2vec_inner" -} -END: Cython Metadata */ +/* Generated by Cython 0.29.2 */ #define PY_SSIZE_T_CLEAN #include "Python.h" @@ -25,7 +7,8 @@ END: Cython Metadata */ #elif PY_VERSION_HEX < 0x02060000 || (0x03000000 <= PY_VERSION_HEX && PY_VERSION_HEX < 0x03030000) #error Cython requires Python 2.6+ or Python 3.3+. 
#else -#define CYTHON_ABI "0_28_4" +#define CYTHON_ABI "0_29_2" +#define CYTHON_HEX_VERSION 0x001D02F0 #define CYTHON_FUTURE_DIVISION 0 #include #ifndef offsetof @@ -96,6 +79,10 @@ END: Cython Metadata */ #define CYTHON_PEP489_MULTI_PHASE_INIT 0 #undef CYTHON_USE_TP_FINALIZE #define CYTHON_USE_TP_FINALIZE 0 + #undef CYTHON_USE_DICT_VERSIONS + #define CYTHON_USE_DICT_VERSIONS 0 + #undef CYTHON_USE_EXC_INFO_STACK + #define CYTHON_USE_EXC_INFO_STACK 0 #elif defined(PYSTON_VERSION) #define CYTHON_COMPILING_IN_PYPY 0 #define CYTHON_COMPILING_IN_PYSTON 1 @@ -133,6 +120,10 @@ END: Cython Metadata */ #define CYTHON_PEP489_MULTI_PHASE_INIT 0 #undef CYTHON_USE_TP_FINALIZE #define CYTHON_USE_TP_FINALIZE 0 + #undef CYTHON_USE_DICT_VERSIONS + #define CYTHON_USE_DICT_VERSIONS 0 + #undef CYTHON_USE_EXC_INFO_STACK + #define CYTHON_USE_EXC_INFO_STACK 0 #else #define CYTHON_COMPILING_IN_PYPY 0 #define CYTHON_COMPILING_IN_PYSTON 0 @@ -186,11 +177,17 @@ END: Cython Metadata */ #define CYTHON_FAST_PYCALL 1 #endif #ifndef CYTHON_PEP489_MULTI_PHASE_INIT - #define CYTHON_PEP489_MULTI_PHASE_INIT (0 && PY_VERSION_HEX >= 0x03050000) + #define CYTHON_PEP489_MULTI_PHASE_INIT (PY_VERSION_HEX >= 0x03050000) #endif #ifndef CYTHON_USE_TP_FINALIZE #define CYTHON_USE_TP_FINALIZE (PY_VERSION_HEX >= 0x030400a1) #endif + #ifndef CYTHON_USE_DICT_VERSIONS + #define CYTHON_USE_DICT_VERSIONS (PY_VERSION_HEX >= 0x030600B1) + #endif + #ifndef CYTHON_USE_EXC_INFO_STACK + #define CYTHON_USE_EXC_INFO_STACK (PY_VERSION_HEX >= 0x030700A3) + #endif #endif #if !defined(CYTHON_FAST_PYCCALL) #define CYTHON_FAST_PYCCALL (CYTHON_FAST_PYCALL && PY_VERSION_HEX >= 0x030600B1) @@ -200,6 +197,9 @@ END: Cython Metadata */ #undef SHIFT #undef BASE #undef MASK + #ifdef SIZEOF_VOID_P + enum { __pyx_check_sizeof_voidp = 1 / (int)(SIZEOF_VOID_P == sizeof(void*)) }; + #endif #endif #ifndef __has_attribute #define __has_attribute(x) 0 @@ -326,6 +326,9 @@ END: Cython Metadata */ #ifndef Py_TPFLAGS_HAVE_FINALIZE #define 
Py_TPFLAGS_HAVE_FINALIZE 0 #endif +#ifndef METH_STACKLESS + #define METH_STACKLESS 0 +#endif #if PY_VERSION_HEX <= 0x030700A3 || !defined(METH_FASTCALL) #ifndef METH_FASTCALL #define METH_FASTCALL 0x80 @@ -339,15 +342,40 @@ END: Cython Metadata */ #endif #if CYTHON_FAST_PYCCALL #define __Pyx_PyFastCFunction_Check(func)\ - ((PyCFunction_Check(func) && (METH_FASTCALL == (PyCFunction_GET_FLAGS(func) & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS))))) + ((PyCFunction_Check(func) && (METH_FASTCALL == (PyCFunction_GET_FLAGS(func) & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS | METH_STACKLESS))))) #else #define __Pyx_PyFastCFunction_Check(func) 0 #endif +#if CYTHON_USE_DICT_VERSIONS +#define __PYX_GET_DICT_VERSION(dict) (((PyDictObject*)(dict))->ma_version_tag) +#define __PYX_UPDATE_DICT_CACHE(dict, value, cache_var, version_var)\ + (version_var) = __PYX_GET_DICT_VERSION(dict);\ + (cache_var) = (value); +#define __PYX_PY_DICT_LOOKUP_IF_MODIFIED(VAR, DICT, LOOKUP) {\ + static PY_UINT64_T __pyx_dict_version = 0;\ + static PyObject *__pyx_dict_cached_value = NULL;\ + if (likely(__PYX_GET_DICT_VERSION(DICT) == __pyx_dict_version)) {\ + (VAR) = __pyx_dict_cached_value;\ + } else {\ + (VAR) = __pyx_dict_cached_value = (LOOKUP);\ + __pyx_dict_version = __PYX_GET_DICT_VERSION(DICT);\ + }\ + } +#else +#define __PYX_GET_DICT_VERSION(dict) (0) +#define __PYX_UPDATE_DICT_CACHE(dict, value, cache_var, version_var) +#define __PYX_PY_DICT_LOOKUP_IF_MODIFIED(VAR, DICT, LOOKUP) (VAR) = (LOOKUP); +#endif #if CYTHON_COMPILING_IN_PYPY && !defined(PyObject_Malloc) #define PyObject_Malloc(s) PyMem_Malloc(s) #define PyObject_Free(p) PyMem_Free(p) #define PyObject_Realloc(p) PyMem_Realloc(p) #endif +#if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX < 0x030400A1 + #define PyMem_RawMalloc(n) PyMem_Malloc(n) + #define PyMem_RawRealloc(p, n) PyMem_Realloc(p, n) + #define PyMem_RawFree(p) PyMem_Free(p) +#endif #if CYTHON_COMPILING_IN_PYSTON #define 
__Pyx_PyCode_HasFreeVars(co) PyCode_HasFreeVars(co) #define __Pyx_PyFrame_SetLineNumber(frame, lineno) PyFrame_SetLineNumber(frame, lineno) @@ -455,8 +483,8 @@ static CYTHON_INLINE void * PyThread_tss_get(Py_tss_t *key) { #if CYTHON_COMPILING_IN_PYPY && !defined(PyObject_Format) #define PyObject_Format(obj, fmt) PyObject_CallMethod(obj, "__format__", "O", fmt) #endif -#define __Pyx_PyString_FormatSafe(a, b) ((unlikely((a) == Py_None)) ? PyNumber_Remainder(a, b) : __Pyx_PyString_Format(a, b)) -#define __Pyx_PyUnicode_FormatSafe(a, b) ((unlikely((a) == Py_None)) ? PyNumber_Remainder(a, b) : PyUnicode_Format(a, b)) +#define __Pyx_PyString_FormatSafe(a, b) ((unlikely((a) == Py_None || (PyString_Check(b) && !PyString_CheckExact(b)))) ? PyNumber_Remainder(a, b) : __Pyx_PyString_Format(a, b)) +#define __Pyx_PyUnicode_FormatSafe(a, b) ((unlikely((a) == Py_None || (PyUnicode_Check(b) && !PyUnicode_CheckExact(b)))) ? PyNumber_Remainder(a, b) : PyUnicode_Format(a, b)) #if PY_MAJOR_VERSION >= 3 #define __Pyx_PyString_Format(a, b) PyUnicode_Format(a, b) #else @@ -614,6 +642,9 @@ typedef struct {PyObject **p; const char *s; const Py_ssize_t n; const char* enc (sizeof(type) == sizeof(Py_ssize_t) &&\ (is_signed || likely(v < (type)PY_SSIZE_T_MAX ||\ v == (type)PY_SSIZE_T_MAX))) ) +static CYTHON_INLINE int __Pyx_is_valid_index(Py_ssize_t i, Py_ssize_t limit) { + return (size_t) i < (size_t) limit; +} #if defined (__cplusplus) && __cplusplus >= 201103L #include #define __Pyx_sst_abs(value) std::abs(value) @@ -672,6 +703,7 @@ static CYTHON_INLINE size_t __Pyx_Py_UNICODE_strlen(const Py_UNICODE *u) { #define __Pyx_Owned_Py_None(b) __Pyx_NewRef(Py_None) static CYTHON_INLINE PyObject * __Pyx_PyBool_FromLong(long b); static CYTHON_INLINE int __Pyx_PyObject_IsTrue(PyObject*); +static CYTHON_INLINE int __Pyx_PyObject_IsTrueAndDecref(PyObject*); static CYTHON_INLINE PyObject* __Pyx_PyNumber_IntOrLong(PyObject* x); #define __Pyx_PySequence_Tuple(obj)\ (likely(PyTuple_CheckExact(obj)) ? 
__Pyx_NewRef(obj) : PySequence_Tuple(obj)) @@ -752,7 +784,7 @@ static int __Pyx_init_sys_getdefaultencoding_params(void) { if (!default_encoding) goto bad; default_encoding_c = PyBytes_AsString(default_encoding); if (!default_encoding_c) goto bad; - __PYX_DEFAULT_STRING_ENCODING = (char*) malloc(strlen(default_encoding_c)); + __PYX_DEFAULT_STRING_ENCODING = (char*) malloc(strlen(default_encoding_c) + 1); if (!__PYX_DEFAULT_STRING_ENCODING) goto bad; strcpy(__PYX_DEFAULT_STRING_ENCODING, default_encoding_c); Py_DECREF(default_encoding); @@ -811,7 +843,7 @@ static const char *__pyx_filename; static const char *__pyx_f[] = { - "word2vec_inner.pyx", + "gensim/models/word2vec_inner.pyx", "__init__.pxd", "type.pxd", }; @@ -828,7 +860,7 @@ static const char *__pyx_f[] = { #endif -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":730 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 * # in Cython to enable them only on the right systems. 
* * ctypedef npy_int8 int8_t # <<<<<<<<<<<<<< @@ -837,7 +869,7 @@ static const char *__pyx_f[] = { */ typedef npy_int8 __pyx_t_5numpy_int8_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":731 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":777 * * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t # <<<<<<<<<<<<<< @@ -846,7 +878,7 @@ typedef npy_int8 __pyx_t_5numpy_int8_t; */ typedef npy_int16 __pyx_t_5numpy_int16_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":732 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 * ctypedef npy_int8 int8_t * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t # <<<<<<<<<<<<<< @@ -855,7 +887,7 @@ typedef npy_int16 __pyx_t_5numpy_int16_t; */ typedef npy_int32 __pyx_t_5numpy_int32_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":733 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 * ctypedef npy_int16 int16_t * ctypedef npy_int32 int32_t * ctypedef npy_int64 int64_t # <<<<<<<<<<<<<< @@ -864,7 +896,7 @@ typedef npy_int32 __pyx_t_5numpy_int32_t; */ typedef npy_int64 __pyx_t_5numpy_int64_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":737 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":783 * #ctypedef npy_int128 int128_t * * ctypedef npy_uint8 uint8_t # <<<<<<<<<<<<<< @@ -873,7 +905,7 @@ typedef npy_int64 __pyx_t_5numpy_int64_t; */ typedef npy_uint8 __pyx_t_5numpy_uint8_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":738 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 * * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t # <<<<<<<<<<<<<< @@ -882,7 +914,7 @@ typedef npy_uint8 __pyx_t_5numpy_uint8_t; */ 
typedef npy_uint16 __pyx_t_5numpy_uint16_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":739 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 * ctypedef npy_uint8 uint8_t * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t # <<<<<<<<<<<<<< @@ -891,7 +923,7 @@ typedef npy_uint16 __pyx_t_5numpy_uint16_t; */ typedef npy_uint32 __pyx_t_5numpy_uint32_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":740 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":786 * ctypedef npy_uint16 uint16_t * ctypedef npy_uint32 uint32_t * ctypedef npy_uint64 uint64_t # <<<<<<<<<<<<<< @@ -900,7 +932,7 @@ typedef npy_uint32 __pyx_t_5numpy_uint32_t; */ typedef npy_uint64 __pyx_t_5numpy_uint64_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":744 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 * #ctypedef npy_uint128 uint128_t * * ctypedef npy_float32 float32_t # <<<<<<<<<<<<<< @@ -909,7 +941,7 @@ typedef npy_uint64 __pyx_t_5numpy_uint64_t; */ typedef npy_float32 __pyx_t_5numpy_float32_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":745 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 * * ctypedef npy_float32 float32_t * ctypedef npy_float64 float64_t # <<<<<<<<<<<<<< @@ -918,7 +950,7 @@ typedef npy_float32 __pyx_t_5numpy_float32_t; */ typedef npy_float64 __pyx_t_5numpy_float64_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":754 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":800 * # The int types are mapped a bit surprising -- * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t # <<<<<<<<<<<<<< @@ -927,7 +959,7 @@ typedef npy_float64 
__pyx_t_5numpy_float64_t; */ typedef npy_long __pyx_t_5numpy_int_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":755 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 * # numpy.int corresponds to 'l' and numpy.long to 'q' * ctypedef npy_long int_t * ctypedef npy_longlong long_t # <<<<<<<<<<<<<< @@ -936,7 +968,7 @@ typedef npy_long __pyx_t_5numpy_int_t; */ typedef npy_longlong __pyx_t_5numpy_long_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":756 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 * ctypedef npy_long int_t * ctypedef npy_longlong long_t * ctypedef npy_longlong longlong_t # <<<<<<<<<<<<<< @@ -945,7 +977,7 @@ typedef npy_longlong __pyx_t_5numpy_long_t; */ typedef npy_longlong __pyx_t_5numpy_longlong_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":758 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":804 * ctypedef npy_longlong longlong_t * * ctypedef npy_ulong uint_t # <<<<<<<<<<<<<< @@ -954,7 +986,7 @@ typedef npy_longlong __pyx_t_5numpy_longlong_t; */ typedef npy_ulong __pyx_t_5numpy_uint_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":759 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 * * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t # <<<<<<<<<<<<<< @@ -963,7 +995,7 @@ typedef npy_ulong __pyx_t_5numpy_uint_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulong_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":760 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 * ctypedef npy_ulong uint_t * ctypedef npy_ulonglong ulong_t * ctypedef npy_ulonglong ulonglong_t # <<<<<<<<<<<<<< @@ -972,7 +1004,7 @@ typedef npy_ulonglong 
__pyx_t_5numpy_ulong_t; */ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":762 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":808 * ctypedef npy_ulonglong ulonglong_t * * ctypedef npy_intp intp_t # <<<<<<<<<<<<<< @@ -981,7 +1013,7 @@ typedef npy_ulonglong __pyx_t_5numpy_ulonglong_t; */ typedef npy_intp __pyx_t_5numpy_intp_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":763 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 * * ctypedef npy_intp intp_t * ctypedef npy_uintp uintp_t # <<<<<<<<<<<<<< @@ -990,7 +1022,7 @@ typedef npy_intp __pyx_t_5numpy_intp_t; */ typedef npy_uintp __pyx_t_5numpy_uintp_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":765 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":811 * ctypedef npy_uintp uintp_t * * ctypedef npy_double float_t # <<<<<<<<<<<<<< @@ -999,7 +1031,7 @@ typedef npy_uintp __pyx_t_5numpy_uintp_t; */ typedef npy_double __pyx_t_5numpy_float_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":766 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 * * ctypedef npy_double float_t * ctypedef npy_double double_t # <<<<<<<<<<<<<< @@ -1008,7 +1040,7 @@ typedef npy_double __pyx_t_5numpy_float_t; */ typedef npy_double __pyx_t_5numpy_double_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":767 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 * ctypedef npy_double float_t * ctypedef npy_double double_t * ctypedef npy_longdouble longdouble_t # <<<<<<<<<<<<<< @@ -1052,7 +1084,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do /*--- Type 
declarations ---*/ -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":769 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":815 * ctypedef npy_longdouble longdouble_t * * ctypedef npy_cfloat cfloat_t # <<<<<<<<<<<<<< @@ -1061,7 +1093,7 @@ static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(do */ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":770 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":816 * * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t # <<<<<<<<<<<<<< @@ -1070,7 +1102,7 @@ typedef npy_cfloat __pyx_t_5numpy_cfloat_t; */ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":771 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":817 * ctypedef npy_cfloat cfloat_t * ctypedef npy_cdouble cdouble_t * ctypedef npy_clongdouble clongdouble_t # <<<<<<<<<<<<<< @@ -1079,7 +1111,7 @@ typedef npy_cdouble __pyx_t_5numpy_cdouble_t; */ typedef npy_clongdouble __pyx_t_5numpy_clongdouble_t; -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":773 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":819 * ctypedef npy_clongdouble clongdouble_t * * ctypedef npy_cdouble complex_t # <<<<<<<<<<<<<< @@ -1281,6 +1313,9 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_GetAttrStr(PyObject* obj, PyObject /* GetBuiltinName.proto */ static PyObject *__Pyx_GetBuiltinName(PyObject *name); +/* PyIntCompare.proto */ +static CYTHON_INLINE PyObject* __Pyx_PyInt_NeObjC(PyObject *op1, PyObject *op2, long intval, long inplace); + /* ExtTypeTest.proto */ static CYTHON_INLINE int __Pyx_TypeTest(PyObject *obj, PyTypeObject *type); @@ -1347,6 +1382,18 @@ static PyObject 
*__Pyx_PyFunction_FastCallDict(PyObject *func, PyObject **args, #else #define __Pyx_PyFunction_FastCallDict(func, args, nargs, kwargs) _PyFunction_FastCallDict(func, args, nargs, kwargs) #endif +#define __Pyx_BUILD_ASSERT_EXPR(cond)\ + (sizeof(char [1 - 2*!(cond)]) - 1) +#ifndef Py_MEMBER_SIZE +#define Py_MEMBER_SIZE(type, member) sizeof(((type *)0)->member) +#endif + static size_t __pyx_pyframe_localsplus_offset = 0; + #include "frameobject.h" + #define __Pxy_PyFrame_Initialize_Offsets()\ + ((void)__Pyx_BUILD_ASSERT_EXPR(sizeof(PyFrameObject) == offsetof(PyFrameObject, f_localsplus) + Py_MEMBER_SIZE(PyFrameObject, f_localsplus)),\ + (void)(__pyx_pyframe_localsplus_offset = ((size_t)PyFrame_Type.tp_basicsize) - Py_MEMBER_SIZE(PyFrameObject, f_localsplus))) + #define __Pyx_PyFrame_GetLocalsplus(frame)\ + (assert(__pyx_pyframe_localsplus_offset), (PyObject **)(((char *)(frame)) + __pyx_pyframe_localsplus_offset)) #endif /* PyCFunctionFastCall.proto */ @@ -1432,6 +1479,11 @@ static CYTHON_INLINE void __Pyx_RaiseNeedMoreValuesError(Py_ssize_t index); /* RaiseNoneIterError.proto */ static CYTHON_INLINE void __Pyx_RaiseNoneNotIterableError(void); +/* GetTopmostException.proto */ +#if CYTHON_USE_EXC_INFO_STACK +static _PyErr_StackItem * __Pyx_PyErr_GetTopmostException(PyThreadState *tstate); +#endif + /* SaveResetException.proto */ #if CYTHON_FAST_THREAD_STATE #define __Pyx_ExceptionSave(type, value, tb) __Pyx__ExceptionSave(__pyx_tstate, type, value, tb) @@ -1459,6 +1511,17 @@ static int __Pyx__GetException(PyThreadState *tstate, PyObject **type, PyObject static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb); #endif +/* TypeImport.proto */ +#ifndef __PYX_HAVE_RT_ImportType_proto +#define __PYX_HAVE_RT_ImportType_proto +enum __Pyx_ImportType_CheckSize { + __Pyx_ImportType_CheckSize_Error = 0, + __Pyx_ImportType_CheckSize_Warn = 1, + __Pyx_ImportType_CheckSize_Ignore = 2 +}; +static PyTypeObject *__Pyx_ImportType(PyObject* module, const char 
*module_name, const char *class_name, size_t size, enum __Pyx_ImportType_CheckSize check_size); +#endif + /* Import.proto */ static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level); @@ -1466,7 +1529,25 @@ static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level); static PyObject* __Pyx_ImportFrom(PyObject* module, PyObject* name); /* GetModuleGlobalName.proto */ -static CYTHON_INLINE PyObject *__Pyx_GetModuleGlobalName(PyObject *name); +#if CYTHON_USE_DICT_VERSIONS +#define __Pyx_GetModuleGlobalName(var, name) {\ + static PY_UINT64_T __pyx_dict_version = 0;\ + static PyObject *__pyx_dict_cached_value = NULL;\ + (var) = (likely(__pyx_dict_version == __PYX_GET_DICT_VERSION(__pyx_d))) ?\ + (likely(__pyx_dict_cached_value) ? __Pyx_NewRef(__pyx_dict_cached_value) : __Pyx_GetBuiltinName(name)) :\ + __Pyx__GetModuleGlobalName(name, &__pyx_dict_version, &__pyx_dict_cached_value);\ +} +#define __Pyx_GetModuleGlobalNameUncached(var, name) {\ + PY_UINT64_T __pyx_dict_version;\ + PyObject *__pyx_dict_cached_value;\ + (var) = __Pyx__GetModuleGlobalName(name, &__pyx_dict_version, &__pyx_dict_cached_value);\ +} +static PyObject *__Pyx__GetModuleGlobalName(PyObject *name, PY_UINT64_T *dict_version, PyObject **dict_cached_value); +#else +#define __Pyx_GetModuleGlobalName(var, name) (var) = __Pyx__GetModuleGlobalName(name) +#define __Pyx_GetModuleGlobalNameUncached(var, name) (var) = __Pyx__GetModuleGlobalName(name) +static CYTHON_INLINE PyObject *__Pyx__GetModuleGlobalName(PyObject *name); +#endif /* PyObjectCallNoArg.proto */ #if CYTHON_COMPILING_IN_CPYTHON @@ -1651,21 +1732,6 @@ static int __Pyx_ExportVoidPtr(PyObject *name, void *p, const char *sig); /* FunctionExport.proto */ static int __Pyx_ExportFunction(const char *name, void (*f)(void), const char *sig); -/* PyIdentifierFromString.proto */ -#if !defined(__Pyx_PyIdentifier_FromString) -#if PY_MAJOR_VERSION < 3 - #define __Pyx_PyIdentifier_FromString(s) PyString_FromString(s) -#else 
- #define __Pyx_PyIdentifier_FromString(s) PyUnicode_FromString(s) -#endif -#endif - -/* ModuleImport.proto */ -static PyObject *__Pyx_ImportModule(const char *name); - -/* TypeImport.proto */ -static PyTypeObject *__Pyx_ImportType(const char *module_name, const char *class_name, size_t size, int strict); - /* InitStrings.proto */ static int __Pyx_InitStrings(__Pyx_StringTabEntry *t); @@ -1745,15 +1811,16 @@ static const char __pyx_k_j[] = "j"; static const char __pyx_k_k[] = "k"; static const char __pyx_k_x[] = "x"; static const char __pyx_k_y[] = "y"; +static const char __pyx_k__9[] = "*"; static const char __pyx_k_hs[] = "hs"; static const char __pyx_k_np[] = "np"; static const char __pyx_k_wv[] = "wv"; -static const char __pyx_k__12[] = "*"; static const char __pyx_k_REAL[] = "REAL"; static const char __pyx_k_code[] = "code"; static const char __pyx_k_init[] = "init"; static const char __pyx_k_item[] = "item"; static const char __pyx_k_main[] = "__main__"; +static const char __pyx_k_name[] = "__name__"; static const char __pyx_k_neu1[] = "_neu1"; static const char __pyx_k_sdot[] = "sdot"; static const char __pyx_k_sent[] = "sent"; @@ -1823,18 +1890,17 @@ static const char __pyx_k_scipy_linalg_blas[] = "scipy.linalg.blas"; static const char __pyx_k_score_sentence_sg[] = "score_sentence_sg"; static const char __pyx_k_MAX_WORDS_IN_BATCH[] = "MAX_WORDS_IN_BATCH"; static const char __pyx_k_cline_in_traceback[] = "cline_in_traceback"; -static const char __pyx_k_word2vec_inner_pyx[] = "word2vec_inner.pyx"; static const char __pyx_k_effective_sentences[] = "effective_sentences"; static const char __pyx_k_score_sentence_cbow[] = "score_sentence_cbow"; static const char __pyx_k_running_training_loss[] = "running_training_loss"; static const char __pyx_k_ndarray_is_not_C_contiguous[] = "ndarray is not C contiguous"; static const char __pyx_k_gensim_models_word2vec_inner[] = "gensim.models.word2vec_inner"; -static const char __pyx_k_running_training_loss_sample[] = 
"_running_training_loss_sample"; static const char __pyx_k_numpy_core_multiarray_failed_to[] = "numpy.core.multiarray failed to import"; static const char __pyx_k_unknown_dtype_code_in_numpy_pxd[] = "unknown dtype code in numpy.pxd (%d)"; static const char __pyx_k_Format_string_allocated_too_shor[] = "Format string allocated too short, see comment in numpy.pxd"; static const char __pyx_k_Non_native_byte_order_not_suppor[] = "Non-native byte order not supported"; static const char __pyx_k_Optimized_cython_functions_for_t[] = "Optimized cython functions for training :class:`~gensim.models.word2vec.Word2Vec` model."; +static const char __pyx_k_gensim_models_word2vec_inner_pyx[] = "gensim/models/word2vec_inner.pyx"; static const char __pyx_k_ndarray_is_not_Fortran_contiguou[] = "ndarray is not Fortran contiguous"; static const char __pyx_k_numpy_core_umath_failed_to_impor[] = "numpy.core.umath failed to import"; static const char __pyx_k_Format_string_allocated_too_shor_2[] = "Format string allocated too short."; @@ -1848,7 +1914,7 @@ static PyObject *__pyx_kp_u_Non_native_byte_order_not_suppor; static PyObject *__pyx_n_s_REAL; static PyObject *__pyx_n_s_RuntimeError; static PyObject *__pyx_n_s_ValueError; -static PyObject *__pyx_n_s__12; +static PyObject *__pyx_n_s__9; static PyObject *__pyx_n_s_alpha; static PyObject *__pyx_n_s_c; static PyObject *__pyx_n_s_cbow_mean; @@ -1867,6 +1933,7 @@ static PyObject *__pyx_n_s_expected; static PyObject *__pyx_n_s_fblas; static PyObject *__pyx_n_s_float32; static PyObject *__pyx_n_s_gensim_models_word2vec_inner; +static PyObject *__pyx_kp_s_gensim_models_word2vec_inner_pyx; static PyObject *__pyx_n_s_hs; static PyObject *__pyx_n_s_i; static PyObject *__pyx_n_s_idx_end; @@ -1879,6 +1946,7 @@ static PyObject *__pyx_n_s_j; static PyObject *__pyx_n_s_k; static PyObject *__pyx_n_s_main; static PyObject *__pyx_n_s_model; +static PyObject *__pyx_n_s_name; static PyObject *__pyx_kp_u_ndarray_is_not_C_contiguous; static PyObject 
*__pyx_kp_u_ndarray_is_not_Fortran_contiguou; static PyObject *__pyx_n_s_negative; @@ -1897,7 +1965,6 @@ static PyObject *__pyx_n_s_random; static PyObject *__pyx_n_s_range; static PyObject *__pyx_n_s_result; static PyObject *__pyx_n_s_running_training_loss; -static PyObject *__pyx_n_s_running_training_loss_sample; static PyObject *__pyx_n_s_sample; static PyObject *__pyx_n_s_sample_int; static PyObject *__pyx_n_s_saxpy; @@ -1930,7 +1997,6 @@ static PyObject *__pyx_n_s_vocab; static PyObject *__pyx_n_s_vocabulary; static PyObject *__pyx_n_s_window; static PyObject *__pyx_n_s_word; -static PyObject *__pyx_kp_s_word2vec_inner_pyx; static PyObject *__pyx_n_s_work; static PyObject *__pyx_n_s_workers; static PyObject *__pyx_n_s_wv; @@ -1956,19 +2022,16 @@ static PyObject *__pyx_tuple__5; static PyObject *__pyx_tuple__6; static PyObject *__pyx_tuple__7; static PyObject *__pyx_tuple__8; -static PyObject *__pyx_tuple__9; static PyObject *__pyx_tuple__10; -static PyObject *__pyx_tuple__11; -static PyObject *__pyx_tuple__13; -static PyObject *__pyx_tuple__15; -static PyObject *__pyx_tuple__17; -static PyObject *__pyx_tuple__19; -static PyObject *__pyx_tuple__21; -static PyObject *__pyx_codeobj__14; -static PyObject *__pyx_codeobj__16; -static PyObject *__pyx_codeobj__18; -static PyObject *__pyx_codeobj__20; -static PyObject *__pyx_codeobj__22; +static PyObject *__pyx_tuple__12; +static PyObject *__pyx_tuple__14; +static PyObject *__pyx_tuple__16; +static PyObject *__pyx_tuple__18; +static PyObject *__pyx_codeobj__11; +static PyObject *__pyx_codeobj__13; +static PyObject *__pyx_codeobj__15; +static PyObject *__pyx_codeobj__17; +static PyObject *__pyx_codeobj__19; /* Late includes */ /* "gensim/models/word2vec_inner.pyx":51 @@ -4056,7 +4119,8 @@ static PyObject *__pyx_f_6gensim_6models_14word2vec_inner_init_w2v_config(struct __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_sample); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 470, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); 
__Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __pyx_t_1 = PyObject_RichCompare(__pyx_t_3, __pyx_int_0, Py_NE); __Pyx_XGOTREF(__pyx_t_1); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 470, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyInt_NeObjC(__pyx_t_3, __pyx_int_0, 0, 0); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 470, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 470, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; @@ -4326,7 +4390,7 @@ static PyObject *__pyx_f_6gensim_6models_14word2vec_inner_init_w2v_config(struct __pyx_t_8 = __Pyx_PyObject_GetAttrStr(__pyx_t_3, __pyx_n_s_randint); if (unlikely(!__pyx_t_8)) __PYX_ERR(0, 491, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_t_8, __pyx_tuple__2, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 491, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_t_8, __pyx_tuple_, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 491, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; __pyx_t_8 = PyNumber_Add(__pyx_t_1, __pyx_t_3); if (unlikely(!__pyx_t_8)) __PYX_ERR(0, 491, __pyx_L1_error) @@ -4420,7 +4484,7 @@ static PyObject *__pyx_f_6gensim_6models_14word2vec_inner_init_w2v_config(struct /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_1train_batch_sg(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char __pyx_doc_6gensim_6models_14word2vec_inner_train_batch_sg[] = "train_batch_sg(model, sentences, alpha, _work, compute_loss)\nUpdate skip-gram model by training on a batch of sentences.\n\n Called internally from :meth:`~gensim.models.word2vec.Word2Vec.train`.\n\n Parameters\n ----------\n model : :class:`~gensim.models.word2Vec.Word2Vec`\n The Word2Vec model instance to train.\n sentences : iterable of list of str\n The 
corpus used to train the model.\n alpha : float\n The learning rate\n _work : np.ndarray\n Private working memory for each worker.\n compute_loss : bool\n Whether or not the training loss should be computed in this batch.\n\n Returns\n -------\n int\n Number of words in the vocabulary actually used for training (They already existed in the vocabulary\n and were not discarded by negative sampling).\n int\n Number of samples used for training. A sample is a positive/negative example.\n\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_1train_batch_sg = {"train_batch_sg", (PyCFunction)__pyx_pw_6gensim_6models_14word2vec_inner_1train_batch_sg, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_train_batch_sg}; +static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_1train_batch_sg = {"train_batch_sg", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14word2vec_inner_1train_batch_sg, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_train_batch_sg}; static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_1train_batch_sg(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_model = 0; PyObject *__pyx_v_sentences = 0; @@ -4529,7 +4593,6 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON PyObject *__pyx_v_token = NULL; PyObject *__pyx_v_word = NULL; PyObject *__pyx_v_item = NULL; - CYTHON_UNUSED long __pyx_v__running_training_loss_sample; PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations PyObject *__pyx_t_1 = NULL; @@ -5243,7 +5306,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON * k = i + c.window + 1 - c.reduced_windows[i] * if k > idx_end: # <<<<<<<<<<<<<< * k = idx_end - * _running_training_loss_sample = 0 + * for j in range(j, k): */ __pyx_t_5 = ((__pyx_v_k > __pyx_v_idx_end) != 0); if (__pyx_t_5) { @@ -5252,8 +5315,8 @@ static PyObject 
*__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON * k = i + c.window + 1 - c.reduced_windows[i] * if k > idx_end: * k = idx_end # <<<<<<<<<<<<<< - * _running_training_loss_sample = 0 * for j in range(j, k): + * if j == i: */ __pyx_v_k = __pyx_v_idx_end; @@ -5262,22 +5325,13 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON * k = i + c.window + 1 - c.reduced_windows[i] * if k > idx_end: # <<<<<<<<<<<<<< * k = idx_end - * _running_training_loss_sample = 0 + * for j in range(j, k): */ } /* "gensim/models/word2vec_inner.pyx":581 * if k > idx_end: * k = idx_end - * _running_training_loss_sample = 0 # <<<<<<<<<<<<<< - * for j in range(j, k): - * if j == i: - */ - __pyx_v__running_training_loss_sample = 0; - - /* "gensim/models/word2vec_inner.pyx":582 - * k = idx_end - * _running_training_loss_sample = 0 * for j in range(j, k): # <<<<<<<<<<<<<< * if j == i: * continue @@ -5287,8 +5341,8 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON for (__pyx_t_23 = __pyx_v_j; __pyx_t_23 < __pyx_t_22; __pyx_t_23+=1) { __pyx_v_j = __pyx_t_23; - /* "gensim/models/word2vec_inner.pyx":583 - * _running_training_loss_sample = 0 + /* "gensim/models/word2vec_inner.pyx":582 + * k = idx_end * for j in range(j, k): * if j == i: # <<<<<<<<<<<<<< * continue @@ -5297,7 +5351,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON __pyx_t_5 = ((__pyx_v_j == __pyx_v_i) != 0); if (__pyx_t_5) { - /* "gensim/models/word2vec_inner.pyx":584 + /* "gensim/models/word2vec_inner.pyx":583 * for j in range(j, k): * if j == i: * continue # <<<<<<<<<<<<<< @@ -5306,8 +5360,8 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON */ goto __pyx_L26_continue; - /* "gensim/models/word2vec_inner.pyx":583 - * _running_training_loss_sample = 0 + /* "gensim/models/word2vec_inner.pyx":582 + * k = idx_end * for j in range(j, k): * if j == i: # <<<<<<<<<<<<<< * continue @@ -5315,7 
+5369,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON */ } - /* "gensim/models/word2vec_inner.pyx":585 + /* "gensim/models/word2vec_inner.pyx":584 * if j == i: * continue * effective_samples += 1 # <<<<<<<<<<<<<< @@ -5324,7 +5378,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON */ __pyx_v_effective_samples = (__pyx_v_effective_samples + 1); - /* "gensim/models/word2vec_inner.pyx":586 + /* "gensim/models/word2vec_inner.pyx":585 * continue * effective_samples += 1 * if c.hs: # <<<<<<<<<<<<<< @@ -5334,7 +5388,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON __pyx_t_5 = (__pyx_v_c.hs != 0); if (__pyx_t_5) { - /* "gensim/models/word2vec_inner.pyx":587 + /* "gensim/models/word2vec_inner.pyx":586 * effective_samples += 1 * if c.hs: * w2v_fast_sentence_sg_hs(c.points[i], c.codes[i], c.codelens[i], c.syn0, c.syn1, c.size, c.indexes[j], c.alpha, c.work, c.word_locks, c.compute_loss, &c.running_training_loss) # <<<<<<<<<<<<<< @@ -5343,7 +5397,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON */ __pyx_f_6gensim_6models_14word2vec_inner_w2v_fast_sentence_sg_hs((__pyx_v_c.points[__pyx_v_i]), (__pyx_v_c.codes[__pyx_v_i]), (__pyx_v_c.codelens[__pyx_v_i]), __pyx_v_c.syn0, __pyx_v_c.syn1, __pyx_v_c.size, (__pyx_v_c.indexes[__pyx_v_j]), __pyx_v_c.alpha, __pyx_v_c.work, __pyx_v_c.word_locks, __pyx_v_c.compute_loss, (&__pyx_v_c.running_training_loss)); - /* "gensim/models/word2vec_inner.pyx":586 + /* "gensim/models/word2vec_inner.pyx":585 * continue * effective_samples += 1 * if c.hs: # <<<<<<<<<<<<<< @@ -5352,7 +5406,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON */ } - /* "gensim/models/word2vec_inner.pyx":588 + /* "gensim/models/word2vec_inner.pyx":587 * if c.hs: * w2v_fast_sentence_sg_hs(c.points[i], c.codes[i], c.codelens[i], c.syn0, c.syn1, c.size, c.indexes[j], c.alpha, c.work, c.word_locks, 
c.compute_loss, &c.running_training_loss) * if c.negative: # <<<<<<<<<<<<<< @@ -5362,7 +5416,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON __pyx_t_5 = (__pyx_v_c.negative != 0); if (__pyx_t_5) { - /* "gensim/models/word2vec_inner.pyx":589 + /* "gensim/models/word2vec_inner.pyx":588 * w2v_fast_sentence_sg_hs(c.points[i], c.codes[i], c.codelens[i], c.syn0, c.syn1, c.size, c.indexes[j], c.alpha, c.work, c.word_locks, c.compute_loss, &c.running_training_loss) * if c.negative: * c.next_random = w2v_fast_sentence_sg_neg(c.negative, c.cum_table, c.cum_table_len, c.syn0, c.syn1neg, c.size, c.indexes[i], c.indexes[j], c.alpha, c.work, c.next_random, c.word_locks, c.compute_loss, &c.running_training_loss) # <<<<<<<<<<<<<< @@ -5371,7 +5425,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON */ __pyx_v_c.next_random = __pyx_f_6gensim_6models_14word2vec_inner_w2v_fast_sentence_sg_neg(__pyx_v_c.negative, __pyx_v_c.cum_table, __pyx_v_c.cum_table_len, __pyx_v_c.syn0, __pyx_v_c.syn1neg, __pyx_v_c.size, (__pyx_v_c.indexes[__pyx_v_i]), (__pyx_v_c.indexes[__pyx_v_j]), __pyx_v_c.alpha, __pyx_v_c.work, __pyx_v_c.next_random, __pyx_v_c.word_locks, __pyx_v_c.compute_loss, (&__pyx_v_c.running_training_loss)); - /* "gensim/models/word2vec_inner.pyx":588 + /* "gensim/models/word2vec_inner.pyx":587 * if c.hs: * w2v_fast_sentence_sg_hs(c.points[i], c.codes[i], c.codelens[i], c.syn0, c.syn1, c.size, c.indexes[j], c.alpha, c.work, c.word_locks, c.compute_loss, &c.running_training_loss) * if c.negative: # <<<<<<<<<<<<<< @@ -5404,25 +5458,25 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON } } - /* "gensim/models/word2vec_inner.pyx":591 + /* "gensim/models/word2vec_inner.pyx":590 * c.next_random = w2v_fast_sentence_sg_neg(c.negative, c.cum_table, c.cum_table_len, c.syn0, c.syn1neg, c.size, c.indexes[i], c.indexes[j], c.alpha, c.work, c.next_random, c.word_locks, c.compute_loss, 
&c.running_training_loss) * * model.running_training_loss += c.running_training_loss # <<<<<<<<<<<<<< * return effective_words, effective_samples * */ - __pyx_t_11 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 591, __pyx_L1_error) + __pyx_t_11 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 590, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_11); - __pyx_t_2 = PyFloat_FromDouble(__pyx_v_c.running_training_loss); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 591, __pyx_L1_error) + __pyx_t_2 = PyFloat_FromDouble(__pyx_v_c.running_training_loss); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 590, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_16 = PyNumber_InPlaceAdd(__pyx_t_11, __pyx_t_2); if (unlikely(!__pyx_t_16)) __PYX_ERR(0, 591, __pyx_L1_error) + __pyx_t_16 = PyNumber_InPlaceAdd(__pyx_t_11, __pyx_t_2); if (unlikely(!__pyx_t_16)) __PYX_ERR(0, 590, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_16); __Pyx_DECREF(__pyx_t_11); __pyx_t_11 = 0; __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - if (__Pyx_PyObject_SetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss, __pyx_t_16) < 0) __PYX_ERR(0, 591, __pyx_L1_error) + if (__Pyx_PyObject_SetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss, __pyx_t_16) < 0) __PYX_ERR(0, 590, __pyx_L1_error) __Pyx_DECREF(__pyx_t_16); __pyx_t_16 = 0; - /* "gensim/models/word2vec_inner.pyx":592 + /* "gensim/models/word2vec_inner.pyx":591 * * model.running_training_loss += c.running_training_loss * return effective_words, effective_samples # <<<<<<<<<<<<<< @@ -5430,11 +5484,11 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON * */ __Pyx_XDECREF(__pyx_r); - __pyx_t_16 = __Pyx_PyInt_From_int(__pyx_v_effective_words); if (unlikely(!__pyx_t_16)) __PYX_ERR(0, 592, __pyx_L1_error) + __pyx_t_16 = __Pyx_PyInt_From_int(__pyx_v_effective_words); if (unlikely(!__pyx_t_16)) __PYX_ERR(0, 591, __pyx_L1_error) 
__Pyx_GOTREF(__pyx_t_16); - __pyx_t_2 = __Pyx_PyInt_From_int(__pyx_v_effective_samples); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 592, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyInt_From_int(__pyx_v_effective_samples); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 591, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_11 = PyTuple_New(2); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 592, __pyx_L1_error) + __pyx_t_11 = PyTuple_New(2); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 591, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_11); __Pyx_GIVEREF(__pyx_t_16); PyTuple_SET_ITEM(__pyx_t_11, 0, __pyx_t_16); @@ -5475,7 +5529,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON return __pyx_r; } -/* "gensim/models/word2vec_inner.pyx":595 +/* "gensim/models/word2vec_inner.pyx":594 * * * def train_batch_cbow(model, sentences, alpha, _work, _neu1, compute_loss): # <<<<<<<<<<<<<< @@ -5486,7 +5540,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_train_batch_sg(CYTHON /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_3train_batch_cbow(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char __pyx_doc_6gensim_6models_14word2vec_inner_2train_batch_cbow[] = "train_batch_cbow(model, sentences, alpha, _work, _neu1, compute_loss)\nUpdate CBOW model by training on a batch of sentences.\n\n Called internally from :meth:`~gensim.models.word2vec.Word2Vec.train`.\n\n Parameters\n ----------\n model : :class:`~gensim.models.word2vec.Word2Vec`\n The Word2Vec model instance to train.\n sentences : iterable of list of str\n The corpus used to train the model.\n alpha : float\n The learning rate.\n _work : np.ndarray\n Private working memory for each worker.\n _neu1 : np.ndarray\n Private working memory for each worker.\n compute_loss : bool\n Whether or not the training loss should be computed in this batch.\n\n Returns\n -------\n int\n Number of words in the vocabulary actually used for training (They already 
existed in the vocabulary\n and were not discarded by negative sampling).\n int\n Number of samples used for training. A sample is a positive/negative example. In the case of CBOW\n this is the same as the effective number of words.\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_3train_batch_cbow = {"train_batch_cbow", (PyCFunction)__pyx_pw_6gensim_6models_14word2vec_inner_3train_batch_cbow, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_2train_batch_cbow}; +static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_3train_batch_cbow = {"train_batch_cbow", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14word2vec_inner_3train_batch_cbow, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_2train_batch_cbow}; static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_3train_batch_cbow(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_model = 0; PyObject *__pyx_v_sentences = 0; @@ -5528,35 +5582,35 @@ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_3train_batch_cbow(PyO case 1: if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_sentences)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 1); __PYX_ERR(0, 595, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 1); __PYX_ERR(0, 594, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 2: if (likely((values[2] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_alpha)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 2); __PYX_ERR(0, 595, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 2); __PYX_ERR(0, 594, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 3: if (likely((values[3] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_work)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 3); __PYX_ERR(0, 595, __pyx_L3_error) + 
__Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 3); __PYX_ERR(0, 594, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 4: if (likely((values[4] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_neu1)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 4); __PYX_ERR(0, 595, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 4); __PYX_ERR(0, 594, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 5: if (likely((values[5] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_compute_loss)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 5); __PYX_ERR(0, 595, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, 5); __PYX_ERR(0, 594, __pyx_L3_error) } } if (unlikely(kw_args > 0)) { - if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "train_batch_cbow") < 0)) __PYX_ERR(0, 595, __pyx_L3_error) + if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "train_batch_cbow") < 0)) __PYX_ERR(0, 594, __pyx_L3_error) } } else if (PyTuple_GET_SIZE(__pyx_args) != 6) { goto __pyx_L5_argtuple_error; @@ -5577,7 +5631,7 @@ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_3train_batch_cbow(PyO } goto __pyx_L4_argument_unpacking_done; __pyx_L5_argtuple_error:; - __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 595, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("train_batch_cbow", 1, 6, 6, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 594, __pyx_L3_error) __pyx_L3_error:; __Pyx_AddTraceback("gensim.models.word2vec_inner.train_batch_cbow", __pyx_clineno, __pyx_lineno, __pyx_filename); __Pyx_RefNannyFinishContext(); @@ -5630,7 +5684,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT int __pyx_t_21; __Pyx_RefNannySetupContext("train_batch_cbow", 0); - /* "gensim/models/word2vec_inner.pyx":627 + /* 
"gensim/models/word2vec_inner.pyx":626 * cdef Word2VecConfig c * cdef int i, j, k * cdef int effective_words = 0, effective_sentences = 0 # <<<<<<<<<<<<<< @@ -5640,7 +5694,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_v_effective_words = 0; __pyx_v_effective_sentences = 0; - /* "gensim/models/word2vec_inner.pyx":630 + /* "gensim/models/word2vec_inner.pyx":629 * cdef int sent_idx, idx_start, idx_end * * init_w2v_config(&c, model, alpha, compute_loss, _work, _neu1) # <<<<<<<<<<<<<< @@ -5649,26 +5703,26 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_t_2.__pyx_n = 1; __pyx_t_2._neu1 = __pyx_v__neu1; - __pyx_t_1 = __pyx_f_6gensim_6models_14word2vec_inner_init_w2v_config((&__pyx_v_c), __pyx_v_model, __pyx_v_alpha, __pyx_v_compute_loss, __pyx_v__work, &__pyx_t_2); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 630, __pyx_L1_error) + __pyx_t_1 = __pyx_f_6gensim_6models_14word2vec_inner_init_w2v_config((&__pyx_v_c), __pyx_v_model, __pyx_v_alpha, __pyx_v_compute_loss, __pyx_v__work, &__pyx_t_2); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 629, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":633 + /* "gensim/models/word2vec_inner.pyx":632 * * # prepare C structures so we can go "full C" and release the Python GIL * vlookup = model.wv.vocab # <<<<<<<<<<<<<< * c.sentence_idx[0] = 0 # indices of the first sentence always start at 0 * for sent in sentences: */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 633, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 632, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_vocab); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 633, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, 
__pyx_n_s_vocab); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 632, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_v_vlookup = __pyx_t_3; __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":634 + /* "gensim/models/word2vec_inner.pyx":633 * # prepare C structures so we can go "full C" and release the Python GIL * vlookup = model.wv.vocab * c.sentence_idx[0] = 0 # indices of the first sentence always start at 0 # <<<<<<<<<<<<<< @@ -5677,7 +5731,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ (__pyx_v_c.sentence_idx[0]) = 0; - /* "gensim/models/word2vec_inner.pyx":635 + /* "gensim/models/word2vec_inner.pyx":634 * vlookup = model.wv.vocab * c.sentence_idx[0] = 0 # indices of the first sentence always start at 0 * for sent in sentences: # <<<<<<<<<<<<<< @@ -5688,26 +5742,26 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_3 = __pyx_v_sentences; __Pyx_INCREF(__pyx_t_3); __pyx_t_4 = 0; __pyx_t_5 = NULL; } else { - __pyx_t_4 = -1; __pyx_t_3 = PyObject_GetIter(__pyx_v_sentences); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 635, __pyx_L1_error) + __pyx_t_4 = -1; __pyx_t_3 = PyObject_GetIter(__pyx_v_sentences); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 634, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_5 = Py_TYPE(__pyx_t_3)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 635, __pyx_L1_error) + __pyx_t_5 = Py_TYPE(__pyx_t_3)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 634, __pyx_L1_error) } for (;;) { if (likely(!__pyx_t_5)) { if (likely(PyList_CheckExact(__pyx_t_3))) { if (__pyx_t_4 >= PyList_GET_SIZE(__pyx_t_3)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_1 = PyList_GET_ITEM(__pyx_t_3, __pyx_t_4); __Pyx_INCREF(__pyx_t_1); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 635, __pyx_L1_error) + __pyx_t_1 = PyList_GET_ITEM(__pyx_t_3, __pyx_t_4); __Pyx_INCREF(__pyx_t_1); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 
634, __pyx_L1_error) #else - __pyx_t_1 = PySequence_ITEM(__pyx_t_3, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 635, __pyx_L1_error) + __pyx_t_1 = PySequence_ITEM(__pyx_t_3, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 634, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); #endif } else { if (__pyx_t_4 >= PyTuple_GET_SIZE(__pyx_t_3)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_1 = PyTuple_GET_ITEM(__pyx_t_3, __pyx_t_4); __Pyx_INCREF(__pyx_t_1); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 635, __pyx_L1_error) + __pyx_t_1 = PyTuple_GET_ITEM(__pyx_t_3, __pyx_t_4); __Pyx_INCREF(__pyx_t_1); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 634, __pyx_L1_error) #else - __pyx_t_1 = PySequence_ITEM(__pyx_t_3, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 635, __pyx_L1_error) + __pyx_t_1 = PySequence_ITEM(__pyx_t_3, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 634, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); #endif } @@ -5717,7 +5771,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT PyObject* exc_type = PyErr_Occurred(); if (exc_type) { if (likely(__Pyx_PyErr_GivenExceptionMatches(exc_type, PyExc_StopIteration))) PyErr_Clear(); - else __PYX_ERR(0, 635, __pyx_L1_error) + else __PYX_ERR(0, 634, __pyx_L1_error) } break; } @@ -5726,18 +5780,18 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __Pyx_XDECREF_SET(__pyx_v_sent, __pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":636 + /* "gensim/models/word2vec_inner.pyx":635 * c.sentence_idx[0] = 0 # indices of the first sentence always start at 0 * for sent in sentences: * if not sent: # <<<<<<<<<<<<<< * continue # ignore empty sentences; leave effective_sentences unchanged * for token in sent: */ - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_v_sent); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(0, 636, __pyx_L1_error) + __pyx_t_6 = 
__Pyx_PyObject_IsTrue(__pyx_v_sent); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(0, 635, __pyx_L1_error) __pyx_t_7 = ((!__pyx_t_6) != 0); if (__pyx_t_7) { - /* "gensim/models/word2vec_inner.pyx":637 + /* "gensim/models/word2vec_inner.pyx":636 * for sent in sentences: * if not sent: * continue # ignore empty sentences; leave effective_sentences unchanged # <<<<<<<<<<<<<< @@ -5746,7 +5800,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ goto __pyx_L3_continue; - /* "gensim/models/word2vec_inner.pyx":636 + /* "gensim/models/word2vec_inner.pyx":635 * c.sentence_idx[0] = 0 # indices of the first sentence always start at 0 * for sent in sentences: * if not sent: # <<<<<<<<<<<<<< @@ -5755,7 +5809,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":638 + /* "gensim/models/word2vec_inner.pyx":637 * if not sent: * continue # ignore empty sentences; leave effective_sentences unchanged * for token in sent: # <<<<<<<<<<<<<< @@ -5766,26 +5820,26 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_1 = __pyx_v_sent; __Pyx_INCREF(__pyx_t_1); __pyx_t_8 = 0; __pyx_t_9 = NULL; } else { - __pyx_t_8 = -1; __pyx_t_1 = PyObject_GetIter(__pyx_v_sent); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 638, __pyx_L1_error) + __pyx_t_8 = -1; __pyx_t_1 = PyObject_GetIter(__pyx_v_sent); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 637, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_9 = Py_TYPE(__pyx_t_1)->tp_iternext; if (unlikely(!__pyx_t_9)) __PYX_ERR(0, 638, __pyx_L1_error) + __pyx_t_9 = Py_TYPE(__pyx_t_1)->tp_iternext; if (unlikely(!__pyx_t_9)) __PYX_ERR(0, 637, __pyx_L1_error) } for (;;) { if (likely(!__pyx_t_9)) { if (likely(PyList_CheckExact(__pyx_t_1))) { if (__pyx_t_8 >= PyList_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_10 = PyList_GET_ITEM(__pyx_t_1, __pyx_t_8); __Pyx_INCREF(__pyx_t_10); 
__pyx_t_8++; if (unlikely(0 < 0)) __PYX_ERR(0, 638, __pyx_L1_error) + __pyx_t_10 = PyList_GET_ITEM(__pyx_t_1, __pyx_t_8); __Pyx_INCREF(__pyx_t_10); __pyx_t_8++; if (unlikely(0 < 0)) __PYX_ERR(0, 637, __pyx_L1_error) #else - __pyx_t_10 = PySequence_ITEM(__pyx_t_1, __pyx_t_8); __pyx_t_8++; if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 638, __pyx_L1_error) + __pyx_t_10 = PySequence_ITEM(__pyx_t_1, __pyx_t_8); __pyx_t_8++; if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 637, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_10); #endif } else { if (__pyx_t_8 >= PyTuple_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_10 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_8); __Pyx_INCREF(__pyx_t_10); __pyx_t_8++; if (unlikely(0 < 0)) __PYX_ERR(0, 638, __pyx_L1_error) + __pyx_t_10 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_8); __Pyx_INCREF(__pyx_t_10); __pyx_t_8++; if (unlikely(0 < 0)) __PYX_ERR(0, 637, __pyx_L1_error) #else - __pyx_t_10 = PySequence_ITEM(__pyx_t_1, __pyx_t_8); __pyx_t_8++; if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 638, __pyx_L1_error) + __pyx_t_10 = PySequence_ITEM(__pyx_t_1, __pyx_t_8); __pyx_t_8++; if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 637, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_10); #endif } @@ -5795,7 +5849,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT PyObject* exc_type = PyErr_Occurred(); if (exc_type) { if (likely(__Pyx_PyErr_GivenExceptionMatches(exc_type, PyExc_StopIteration))) PyErr_Clear(); - else __PYX_ERR(0, 638, __pyx_L1_error) + else __PYX_ERR(0, 637, __pyx_L1_error) } break; } @@ -5804,16 +5858,16 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __Pyx_XDECREF_SET(__pyx_v_token, __pyx_t_10); __pyx_t_10 = 0; - /* "gensim/models/word2vec_inner.pyx":639 + /* "gensim/models/word2vec_inner.pyx":638 * continue # ignore empty sentences; leave effective_sentences unchanged * for token in sent: * word = vlookup[token] if token in vlookup else None # <<<<<<<<<<<<<< * if 
word is None: * continue # leaving `effective_words` unchanged = shortening the sentence = expanding the window */ - __pyx_t_7 = (__Pyx_PySequence_ContainsTF(__pyx_v_token, __pyx_v_vlookup, Py_EQ)); if (unlikely(__pyx_t_7 < 0)) __PYX_ERR(0, 639, __pyx_L1_error) + __pyx_t_7 = (__Pyx_PySequence_ContainsTF(__pyx_v_token, __pyx_v_vlookup, Py_EQ)); if (unlikely(__pyx_t_7 < 0)) __PYX_ERR(0, 638, __pyx_L1_error) if ((__pyx_t_7 != 0)) { - __pyx_t_11 = __Pyx_PyObject_GetItem(__pyx_v_vlookup, __pyx_v_token); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 639, __pyx_L1_error) + __pyx_t_11 = __Pyx_PyObject_GetItem(__pyx_v_vlookup, __pyx_v_token); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 638, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_11); __pyx_t_10 = __pyx_t_11; __pyx_t_11 = 0; @@ -5824,7 +5878,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __Pyx_XDECREF_SET(__pyx_v_word, __pyx_t_10); __pyx_t_10 = 0; - /* "gensim/models/word2vec_inner.pyx":640 + /* "gensim/models/word2vec_inner.pyx":639 * for token in sent: * word = vlookup[token] if token in vlookup else None * if word is None: # <<<<<<<<<<<<<< @@ -5835,7 +5889,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = (__pyx_t_7 != 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":641 + /* "gensim/models/word2vec_inner.pyx":640 * word = vlookup[token] if token in vlookup else None * if word is None: * continue # leaving `effective_words` unchanged = shortening the sentence = expanding the window # <<<<<<<<<<<<<< @@ -5844,7 +5898,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ goto __pyx_L6_continue; - /* "gensim/models/word2vec_inner.pyx":640 + /* "gensim/models/word2vec_inner.pyx":639 * for token in sent: * word = vlookup[token] if token in vlookup else None * if word is None: # <<<<<<<<<<<<<< @@ -5853,7 +5907,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* 
"gensim/models/word2vec_inner.pyx":642 + /* "gensim/models/word2vec_inner.pyx":641 * if word is None: * continue # leaving `effective_words` unchanged = shortening the sentence = expanding the window * if c.sample and word.sample_int < random_int32(&c.next_random): # <<<<<<<<<<<<<< @@ -5866,20 +5920,20 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = __pyx_t_7; goto __pyx_L10_bool_binop_done; } - __pyx_t_10 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_sample_int); if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 642, __pyx_L1_error) + __pyx_t_10 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_sample_int); if (unlikely(!__pyx_t_10)) __PYX_ERR(0, 641, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_10); - __pyx_t_11 = __Pyx_PyInt_From_unsigned_PY_LONG_LONG(__pyx_f_6gensim_6models_14word2vec_inner_random_int32((&__pyx_v_c.next_random))); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 642, __pyx_L1_error) + __pyx_t_11 = __Pyx_PyInt_From_unsigned_PY_LONG_LONG(__pyx_f_6gensim_6models_14word2vec_inner_random_int32((&__pyx_v_c.next_random))); if (unlikely(!__pyx_t_11)) __PYX_ERR(0, 641, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_11); - __pyx_t_12 = PyObject_RichCompare(__pyx_t_10, __pyx_t_11, Py_LT); __Pyx_XGOTREF(__pyx_t_12); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 642, __pyx_L1_error) + __pyx_t_12 = PyObject_RichCompare(__pyx_t_10, __pyx_t_11, Py_LT); __Pyx_XGOTREF(__pyx_t_12); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 641, __pyx_L1_error) __Pyx_DECREF(__pyx_t_10); __pyx_t_10 = 0; __Pyx_DECREF(__pyx_t_11); __pyx_t_11 = 0; - __pyx_t_7 = __Pyx_PyObject_IsTrue(__pyx_t_12); if (unlikely(__pyx_t_7 < 0)) __PYX_ERR(0, 642, __pyx_L1_error) + __pyx_t_7 = __Pyx_PyObject_IsTrue(__pyx_t_12); if (unlikely(__pyx_t_7 < 0)) __PYX_ERR(0, 641, __pyx_L1_error) __Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; __pyx_t_6 = __pyx_t_7; __pyx_L10_bool_binop_done:; if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":643 + /* "gensim/models/word2vec_inner.pyx":642 * continue # 
leaving `effective_words` unchanged = shortening the sentence = expanding the window * if c.sample and word.sample_int < random_int32(&c.next_random): * continue # <<<<<<<<<<<<<< @@ -5888,7 +5942,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ goto __pyx_L6_continue; - /* "gensim/models/word2vec_inner.pyx":642 + /* "gensim/models/word2vec_inner.pyx":641 * if word is None: * continue # leaving `effective_words` unchanged = shortening the sentence = expanding the window * if c.sample and word.sample_int < random_int32(&c.next_random): # <<<<<<<<<<<<<< @@ -5897,20 +5951,20 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":644 + /* "gensim/models/word2vec_inner.pyx":643 * if c.sample and word.sample_int < random_int32(&c.next_random): * continue * c.indexes[effective_words] = word.index # <<<<<<<<<<<<<< * if c.hs: * c.codelens[effective_words] = len(word.code) */ - __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_index); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 644, __pyx_L1_error) + __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_index); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 643, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_12); - __pyx_t_13 = __Pyx_PyInt_As_npy_uint32(__pyx_t_12); if (unlikely((__pyx_t_13 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 644, __pyx_L1_error) + __pyx_t_13 = __Pyx_PyInt_As_npy_uint32(__pyx_t_12); if (unlikely((__pyx_t_13 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 643, __pyx_L1_error) __Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; (__pyx_v_c.indexes[__pyx_v_effective_words]) = __pyx_t_13; - /* "gensim/models/word2vec_inner.pyx":645 + /* "gensim/models/word2vec_inner.pyx":644 * continue * c.indexes[effective_words] = word.index * if c.hs: # <<<<<<<<<<<<<< @@ -5920,46 +5974,46 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = (__pyx_v_c.hs 
!= 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":646 + /* "gensim/models/word2vec_inner.pyx":645 * c.indexes[effective_words] = word.index * if c.hs: * c.codelens[effective_words] = len(word.code) # <<<<<<<<<<<<<< * c.codes[effective_words] = np.PyArray_DATA(word.code) * c.points[effective_words] = np.PyArray_DATA(word.point) */ - __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 646, __pyx_L1_error) + __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 645, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_12); - __pyx_t_14 = PyObject_Length(__pyx_t_12); if (unlikely(__pyx_t_14 == ((Py_ssize_t)-1))) __PYX_ERR(0, 646, __pyx_L1_error) + __pyx_t_14 = PyObject_Length(__pyx_t_12); if (unlikely(__pyx_t_14 == ((Py_ssize_t)-1))) __PYX_ERR(0, 645, __pyx_L1_error) __Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; (__pyx_v_c.codelens[__pyx_v_effective_words]) = ((int)__pyx_t_14); - /* "gensim/models/word2vec_inner.pyx":647 + /* "gensim/models/word2vec_inner.pyx":646 * if c.hs: * c.codelens[effective_words] = len(word.code) * c.codes[effective_words] = np.PyArray_DATA(word.code) # <<<<<<<<<<<<<< * c.points[effective_words] = np.PyArray_DATA(word.point) * effective_words += 1 */ - __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 647, __pyx_L1_error) + __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 646, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_12); - if (!(likely(((__pyx_t_12) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_12, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 647, __pyx_L1_error) + if (!(likely(((__pyx_t_12) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_12, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 646, __pyx_L1_error) (__pyx_v_c.codes[__pyx_v_effective_words]) = ((__pyx_t_5numpy_uint8_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_12))); 
__Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; - /* "gensim/models/word2vec_inner.pyx":648 + /* "gensim/models/word2vec_inner.pyx":647 * c.codelens[effective_words] = len(word.code) * c.codes[effective_words] = np.PyArray_DATA(word.code) * c.points[effective_words] = np.PyArray_DATA(word.point) # <<<<<<<<<<<<<< * effective_words += 1 * if effective_words == MAX_SENTENCE_LEN: */ - __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_point); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 648, __pyx_L1_error) + __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_point); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 647, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_12); - if (!(likely(((__pyx_t_12) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_12, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 648, __pyx_L1_error) + if (!(likely(((__pyx_t_12) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_12, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 647, __pyx_L1_error) (__pyx_v_c.points[__pyx_v_effective_words]) = ((__pyx_t_5numpy_uint32_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_12))); __Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; - /* "gensim/models/word2vec_inner.pyx":645 + /* "gensim/models/word2vec_inner.pyx":644 * continue * c.indexes[effective_words] = word.index * if c.hs: # <<<<<<<<<<<<<< @@ -5968,7 +6022,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":649 + /* "gensim/models/word2vec_inner.pyx":648 * c.codes[effective_words] = np.PyArray_DATA(word.code) * c.points[effective_words] = np.PyArray_DATA(word.point) * effective_words += 1 # <<<<<<<<<<<<<< @@ -5977,7 +6031,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_effective_words = (__pyx_v_effective_words + 1); - /* "gensim/models/word2vec_inner.pyx":650 + /* "gensim/models/word2vec_inner.pyx":649 * c.points[effective_words] = np.PyArray_DATA(word.point) * effective_words += 1 * if effective_words == 
MAX_SENTENCE_LEN: # <<<<<<<<<<<<<< @@ -5987,7 +6041,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = ((__pyx_v_effective_words == 0x2710) != 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":651 + /* "gensim/models/word2vec_inner.pyx":650 * effective_words += 1 * if effective_words == MAX_SENTENCE_LEN: * break # TODO: log warning, tally overflow? # <<<<<<<<<<<<<< @@ -5996,7 +6050,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ goto __pyx_L7_break; - /* "gensim/models/word2vec_inner.pyx":650 + /* "gensim/models/word2vec_inner.pyx":649 * c.points[effective_words] = np.PyArray_DATA(word.point) * effective_words += 1 * if effective_words == MAX_SENTENCE_LEN: # <<<<<<<<<<<<<< @@ -6005,7 +6059,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":638 + /* "gensim/models/word2vec_inner.pyx":637 * if not sent: * continue # ignore empty sentences; leave effective_sentences unchanged * for token in sent: # <<<<<<<<<<<<<< @@ -6017,7 +6071,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_L7_break:; __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":656 + /* "gensim/models/word2vec_inner.pyx":655 * # across sentence boundaries. 
* # indices of sentence number X are between tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 663, __pyx_L1_error) + __pyx_t_5 = Py_TYPE(__pyx_t_12)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 662, __pyx_L1_error) } __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; for (;;) { @@ -6158,17 +6212,17 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT if (likely(PyList_CheckExact(__pyx_t_12))) { if (__pyx_t_4 >= PyList_GET_SIZE(__pyx_t_12)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_3 = PyList_GET_ITEM(__pyx_t_12, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 663, __pyx_L1_error) + __pyx_t_3 = PyList_GET_ITEM(__pyx_t_12, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 662, __pyx_L1_error) #else - __pyx_t_3 = PySequence_ITEM(__pyx_t_12, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 663, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(__pyx_t_12, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 662, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); #endif } else { if (__pyx_t_4 >= PyTuple_GET_SIZE(__pyx_t_12)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_12, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 663, __pyx_L1_error) + __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_12, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 662, __pyx_L1_error) #else - __pyx_t_3 = PySequence_ITEM(__pyx_t_12, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 663, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(__pyx_t_12, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 662, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); #endif } @@ -6178,7 +6232,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT PyObject* exc_type = PyErr_Occurred(); if (exc_type) 
{ if (likely(__Pyx_PyErr_GivenExceptionMatches(exc_type, PyExc_StopIteration))) PyErr_Clear(); - else __PYX_ERR(0, 663, __pyx_L1_error) + else __PYX_ERR(0, 662, __pyx_L1_error) } break; } @@ -6189,17 +6243,17 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_v_i = __pyx_t_15; __pyx_t_15 = (__pyx_t_15 + 1); - /* "gensim/models/word2vec_inner.pyx":664 + /* "gensim/models/word2vec_inner.pyx":663 * # precompute "reduced window" offsets in a single randint() call * for i, item in enumerate(model.random.randint(0, c.window, effective_words)): * c.reduced_windows[i] = item # <<<<<<<<<<<<<< * * # release GIL & train on all sentences */ - __pyx_t_13 = __Pyx_PyInt_As_npy_uint32(__pyx_v_item); if (unlikely((__pyx_t_13 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 664, __pyx_L1_error) + __pyx_t_13 = __Pyx_PyInt_As_npy_uint32(__pyx_v_item); if (unlikely((__pyx_t_13 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 663, __pyx_L1_error) (__pyx_v_c.reduced_windows[__pyx_v_i]) = __pyx_t_13; - /* "gensim/models/word2vec_inner.pyx":663 + /* "gensim/models/word2vec_inner.pyx":662 * * # precompute "reduced window" offsets in a single randint() call * for i, item in enumerate(model.random.randint(0, c.window, effective_words)): # <<<<<<<<<<<<<< @@ -6209,7 +6263,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT } __Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; - /* "gensim/models/word2vec_inner.pyx":667 + /* "gensim/models/word2vec_inner.pyx":666 * * # release GIL & train on all sentences * with nogil: # <<<<<<<<<<<<<< @@ -6224,7 +6278,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT #endif /*try:*/ { - /* "gensim/models/word2vec_inner.pyx":668 + /* "gensim/models/word2vec_inner.pyx":667 * # release GIL & train on all sentences * with nogil: * for sent_idx in range(effective_sentences): # <<<<<<<<<<<<<< @@ -6236,7 +6290,7 @@ static PyObject 
*__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT for (__pyx_t_18 = 0; __pyx_t_18 < __pyx_t_16; __pyx_t_18+=1) { __pyx_v_sent_idx = __pyx_t_18; - /* "gensim/models/word2vec_inner.pyx":669 + /* "gensim/models/word2vec_inner.pyx":668 * with nogil: * for sent_idx in range(effective_sentences): * idx_start = c.sentence_idx[sent_idx] # <<<<<<<<<<<<<< @@ -6245,7 +6299,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_idx_start = (__pyx_v_c.sentence_idx[__pyx_v_sent_idx]); - /* "gensim/models/word2vec_inner.pyx":670 + /* "gensim/models/word2vec_inner.pyx":669 * for sent_idx in range(effective_sentences): * idx_start = c.sentence_idx[sent_idx] * idx_end = c.sentence_idx[sent_idx + 1] # <<<<<<<<<<<<<< @@ -6254,7 +6308,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_idx_end = (__pyx_v_c.sentence_idx[(__pyx_v_sent_idx + 1)]); - /* "gensim/models/word2vec_inner.pyx":671 + /* "gensim/models/word2vec_inner.pyx":670 * idx_start = c.sentence_idx[sent_idx] * idx_end = c.sentence_idx[sent_idx + 1] * for i in range(idx_start, idx_end): # <<<<<<<<<<<<<< @@ -6266,7 +6320,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT for (__pyx_t_21 = __pyx_v_idx_start; __pyx_t_21 < __pyx_t_20; __pyx_t_21+=1) { __pyx_v_i = __pyx_t_21; - /* "gensim/models/word2vec_inner.pyx":672 + /* "gensim/models/word2vec_inner.pyx":671 * idx_end = c.sentence_idx[sent_idx + 1] * for i in range(idx_start, idx_end): * j = i - c.window + c.reduced_windows[i] # <<<<<<<<<<<<<< @@ -6275,7 +6329,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_j = ((__pyx_v_i - __pyx_v_c.window) + (__pyx_v_c.reduced_windows[__pyx_v_i])); - /* "gensim/models/word2vec_inner.pyx":673 + /* "gensim/models/word2vec_inner.pyx":672 * for i in range(idx_start, idx_end): * j = i - c.window + c.reduced_windows[i] * if j < idx_start: # <<<<<<<<<<<<<< @@ 
-6285,7 +6339,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = ((__pyx_v_j < __pyx_v_idx_start) != 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":674 + /* "gensim/models/word2vec_inner.pyx":673 * j = i - c.window + c.reduced_windows[i] * if j < idx_start: * j = idx_start # <<<<<<<<<<<<<< @@ -6294,7 +6348,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_j = __pyx_v_idx_start; - /* "gensim/models/word2vec_inner.pyx":673 + /* "gensim/models/word2vec_inner.pyx":672 * for i in range(idx_start, idx_end): * j = i - c.window + c.reduced_windows[i] * if j < idx_start: # <<<<<<<<<<<<<< @@ -6303,7 +6357,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":675 + /* "gensim/models/word2vec_inner.pyx":674 * if j < idx_start: * j = idx_start * k = i + c.window + 1 - c.reduced_windows[i] # <<<<<<<<<<<<<< @@ -6312,7 +6366,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_k = (((__pyx_v_i + __pyx_v_c.window) + 1) - (__pyx_v_c.reduced_windows[__pyx_v_i])); - /* "gensim/models/word2vec_inner.pyx":676 + /* "gensim/models/word2vec_inner.pyx":675 * j = idx_start * k = i + c.window + 1 - c.reduced_windows[i] * if k > idx_end: # <<<<<<<<<<<<<< @@ -6322,7 +6376,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = ((__pyx_v_k > __pyx_v_idx_end) != 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":677 + /* "gensim/models/word2vec_inner.pyx":676 * k = i + c.window + 1 - c.reduced_windows[i] * if k > idx_end: * k = idx_end # <<<<<<<<<<<<<< @@ -6331,7 +6385,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_k = __pyx_v_idx_end; - /* "gensim/models/word2vec_inner.pyx":676 + /* "gensim/models/word2vec_inner.pyx":675 * j = idx_start * k = i + c.window + 1 - 
c.reduced_windows[i] * if k > idx_end: # <<<<<<<<<<<<<< @@ -6340,7 +6394,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":678 + /* "gensim/models/word2vec_inner.pyx":677 * if k > idx_end: * k = idx_end * if c.hs: # <<<<<<<<<<<<<< @@ -6350,7 +6404,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_6 = (__pyx_v_c.hs != 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":679 + /* "gensim/models/word2vec_inner.pyx":678 * k = idx_end * if c.hs: * w2v_fast_sentence_cbow_hs(c.points[i], c.codes[i], c.codelens, c.neu1, c.syn0, c.syn1, c.size, c.indexes, c.alpha, c.work, i, j, k, c.cbow_mean, c.word_locks, c.compute_loss, &c.running_training_loss) # <<<<<<<<<<<<<< @@ -6359,7 +6413,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_f_6gensim_6models_14word2vec_inner_w2v_fast_sentence_cbow_hs((__pyx_v_c.points[__pyx_v_i]), (__pyx_v_c.codes[__pyx_v_i]), __pyx_v_c.codelens, __pyx_v_c.neu1, __pyx_v_c.syn0, __pyx_v_c.syn1, __pyx_v_c.size, __pyx_v_c.indexes, __pyx_v_c.alpha, __pyx_v_c.work, __pyx_v_i, __pyx_v_j, __pyx_v_k, __pyx_v_c.cbow_mean, __pyx_v_c.word_locks, __pyx_v_c.compute_loss, (&__pyx_v_c.running_training_loss)); - /* "gensim/models/word2vec_inner.pyx":678 + /* "gensim/models/word2vec_inner.pyx":677 * if k > idx_end: * k = idx_end * if c.hs: # <<<<<<<<<<<<<< @@ -6368,7 +6422,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ } - /* "gensim/models/word2vec_inner.pyx":680 + /* "gensim/models/word2vec_inner.pyx":679 * if c.hs: * w2v_fast_sentence_cbow_hs(c.points[i], c.codes[i], c.codelens, c.neu1, c.syn0, c.syn1, c.size, c.indexes, c.alpha, c.work, i, j, k, c.cbow_mean, c.word_locks, c.compute_loss, &c.running_training_loss) * if c.negative: # <<<<<<<<<<<<<< @@ -6378,7 +6432,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT 
__pyx_t_6 = (__pyx_v_c.negative != 0); if (__pyx_t_6) { - /* "gensim/models/word2vec_inner.pyx":681 + /* "gensim/models/word2vec_inner.pyx":680 * w2v_fast_sentence_cbow_hs(c.points[i], c.codes[i], c.codelens, c.neu1, c.syn0, c.syn1, c.size, c.indexes, c.alpha, c.work, i, j, k, c.cbow_mean, c.word_locks, c.compute_loss, &c.running_training_loss) * if c.negative: * c.next_random = w2v_fast_sentence_cbow_neg(c.negative, c.cum_table, c.cum_table_len, c.codelens, c.neu1, c.syn0, c.syn1neg, c.size, c.indexes, c.alpha, c.work, i, j, k, c.cbow_mean, c.next_random, c.word_locks, c.compute_loss, &c.running_training_loss) # <<<<<<<<<<<<<< @@ -6387,7 +6441,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT */ __pyx_v_c.next_random = __pyx_f_6gensim_6models_14word2vec_inner_w2v_fast_sentence_cbow_neg(__pyx_v_c.negative, __pyx_v_c.cum_table, __pyx_v_c.cum_table_len, __pyx_v_c.codelens, __pyx_v_c.neu1, __pyx_v_c.syn0, __pyx_v_c.syn1neg, __pyx_v_c.size, __pyx_v_c.indexes, __pyx_v_c.alpha, __pyx_v_c.work, __pyx_v_i, __pyx_v_j, __pyx_v_k, __pyx_v_c.cbow_mean, __pyx_v_c.next_random, __pyx_v_c.word_locks, __pyx_v_c.compute_loss, (&__pyx_v_c.running_training_loss)); - /* "gensim/models/word2vec_inner.pyx":680 + /* "gensim/models/word2vec_inner.pyx":679 * if c.hs: * w2v_fast_sentence_cbow_hs(c.points[i], c.codes[i], c.codelens, c.neu1, c.syn0, c.syn1, c.size, c.indexes, c.alpha, c.work, i, j, k, c.cbow_mean, c.word_locks, c.compute_loss, &c.running_training_loss) * if c.negative: # <<<<<<<<<<<<<< @@ -6399,7 +6453,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT } } - /* "gensim/models/word2vec_inner.pyx":667 + /* "gensim/models/word2vec_inner.pyx":666 * * # release GIL & train on all sentences * with nogil: # <<<<<<<<<<<<<< @@ -6418,25 +6472,25 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT } } - /* "gensim/models/word2vec_inner.pyx":682 + /* 
"gensim/models/word2vec_inner.pyx":681 * if c.negative: * c.next_random = w2v_fast_sentence_cbow_neg(c.negative, c.cum_table, c.cum_table_len, c.codelens, c.neu1, c.syn0, c.syn1neg, c.size, c.indexes, c.alpha, c.work, i, j, k, c.cbow_mean, c.next_random, c.word_locks, c.compute_loss, &c.running_training_loss) * model.running_training_loss += c.running_training_loss # <<<<<<<<<<<<<< * * return effective_words, effective_words */ - __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 682, __pyx_L1_error) + __pyx_t_12 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 681, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_12); - __pyx_t_3 = PyFloat_FromDouble(__pyx_v_c.running_training_loss); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 682, __pyx_L1_error) + __pyx_t_3 = PyFloat_FromDouble(__pyx_v_c.running_training_loss); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 681, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_17 = PyNumber_InPlaceAdd(__pyx_t_12, __pyx_t_3); if (unlikely(!__pyx_t_17)) __PYX_ERR(0, 682, __pyx_L1_error) + __pyx_t_17 = PyNumber_InPlaceAdd(__pyx_t_12, __pyx_t_3); if (unlikely(!__pyx_t_17)) __PYX_ERR(0, 681, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_17); __Pyx_DECREF(__pyx_t_12); __pyx_t_12 = 0; __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - if (__Pyx_PyObject_SetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss, __pyx_t_17) < 0) __PYX_ERR(0, 682, __pyx_L1_error) + if (__Pyx_PyObject_SetAttrStr(__pyx_v_model, __pyx_n_s_running_training_loss, __pyx_t_17) < 0) __PYX_ERR(0, 681, __pyx_L1_error) __Pyx_DECREF(__pyx_t_17); __pyx_t_17 = 0; - /* "gensim/models/word2vec_inner.pyx":684 + /* "gensim/models/word2vec_inner.pyx":683 * model.running_training_loss += c.running_training_loss * * return effective_words, effective_words # <<<<<<<<<<<<<< @@ -6444,11 +6498,11 @@ static PyObject 
*__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT * */ __Pyx_XDECREF(__pyx_r); - __pyx_t_17 = __Pyx_PyInt_From_int(__pyx_v_effective_words); if (unlikely(!__pyx_t_17)) __PYX_ERR(0, 684, __pyx_L1_error) + __pyx_t_17 = __Pyx_PyInt_From_int(__pyx_v_effective_words); if (unlikely(!__pyx_t_17)) __PYX_ERR(0, 683, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_17); - __pyx_t_3 = __Pyx_PyInt_From_int(__pyx_v_effective_words); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 684, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_int(__pyx_v_effective_words); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 683, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_12 = PyTuple_New(2); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 684, __pyx_L1_error) + __pyx_t_12 = PyTuple_New(2); if (unlikely(!__pyx_t_12)) __PYX_ERR(0, 683, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_12); __Pyx_GIVEREF(__pyx_t_17); PyTuple_SET_ITEM(__pyx_t_12, 0, __pyx_t_17); @@ -6460,7 +6514,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT __pyx_t_12 = 0; goto __pyx_L0; - /* "gensim/models/word2vec_inner.pyx":595 + /* "gensim/models/word2vec_inner.pyx":594 * * * def train_batch_cbow(model, sentences, alpha, _work, _neu1, compute_loss): # <<<<<<<<<<<<<< @@ -6489,7 +6543,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT return __pyx_r; } -/* "gensim/models/word2vec_inner.pyx":687 +/* "gensim/models/word2vec_inner.pyx":686 * * * def score_sentence_sg(model, sentence, _work): # <<<<<<<<<<<<<< @@ -6500,7 +6554,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_2train_batch_cbow(CYT /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_5score_sentence_sg(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char __pyx_doc_6gensim_6models_14word2vec_inner_4score_sentence_sg[] = "score_sentence_sg(model, sentence, _work)\nObtain likelihood score for a single sentence in a fitted skip-gram 
representation.\n\n Notes\n -----\n This scoring function is only implemented for hierarchical softmax (`model.hs == 1`).\n The model should have been trained using the skip-gram model (`model.sg` == 1`).\n\n Parameters\n ----------\n model : :class:`~gensim.models.word2vec.Word2Vec`\n The trained model. It **MUST** have been trained using hierarchical softmax and the skip-gram algorithm.\n sentence : list of str\n The words comprising the sentence to be scored.\n _work : np.ndarray\n Private working memory for each worker.\n\n Returns\n -------\n float\n The probability assigned to this sentence by the Skip-Gram model.\n\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_5score_sentence_sg = {"score_sentence_sg", (PyCFunction)__pyx_pw_6gensim_6models_14word2vec_inner_5score_sentence_sg, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_4score_sentence_sg}; +static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_5score_sentence_sg = {"score_sentence_sg", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14word2vec_inner_5score_sentence_sg, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_4score_sentence_sg}; static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_5score_sentence_sg(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_model = 0; PyObject *__pyx_v_sentence = 0; @@ -6533,17 +6587,17 @@ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_5score_sentence_sg(Py case 1: if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_sentence)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("score_sentence_sg", 1, 3, 3, 1); __PYX_ERR(0, 687, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_sg", 1, 3, 3, 1); __PYX_ERR(0, 686, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 2: if (likely((values[2] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_work)) != 0)) kw_args--; else { - 
__Pyx_RaiseArgtupleInvalid("score_sentence_sg", 1, 3, 3, 2); __PYX_ERR(0, 687, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_sg", 1, 3, 3, 2); __PYX_ERR(0, 686, __pyx_L3_error) } } if (unlikely(kw_args > 0)) { - if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "score_sentence_sg") < 0)) __PYX_ERR(0, 687, __pyx_L3_error) + if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "score_sentence_sg") < 0)) __PYX_ERR(0, 686, __pyx_L3_error) } } else if (PyTuple_GET_SIZE(__pyx_args) != 3) { goto __pyx_L5_argtuple_error; @@ -6558,7 +6612,7 @@ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_5score_sentence_sg(Py } goto __pyx_L4_argument_unpacking_done; __pyx_L5_argtuple_error:; - __Pyx_RaiseArgtupleInvalid("score_sentence_sg", 1, 3, 3, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 687, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_sg", 1, 3, 3, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 686, __pyx_L3_error) __pyx_L3_error:; __Pyx_AddTraceback("gensim.models.word2vec_inner.score_sentence_sg", __pyx_clineno, __pyx_lineno, __pyx_filename); __Pyx_RefNannyFinishContext(); @@ -6600,52 +6654,52 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY int __pyx_t_15; __Pyx_RefNannySetupContext("score_sentence_sg", 0); - /* "gensim/models/word2vec_inner.pyx":711 + /* "gensim/models/word2vec_inner.pyx":710 * """ * cdef Word2VecConfig c * c.syn0 = (np.PyArray_DATA(model.wv.vectors)) # <<<<<<<<<<<<<< * c.size = model.wv.vector_size * */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 711, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 710, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_vectors); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 711, 
__pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_vectors); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 710, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 711, __pyx_L1_error) + if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 710, __pyx_L1_error) __pyx_v_c.syn0 = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_2))); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/word2vec_inner.pyx":712 + /* "gensim/models/word2vec_inner.pyx":711 * cdef Word2VecConfig c * c.syn0 = (np.PyArray_DATA(model.wv.vectors)) * c.size = model.wv.vector_size # <<<<<<<<<<<<<< * * c.window = model.window */ - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 712, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 711, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_2, __pyx_n_s_vector_size); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 712, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_2, __pyx_n_s_vector_size); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 711, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - __pyx_t_3 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_3 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 712, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_3 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 711, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_v_c.size = __pyx_t_3; - /* "gensim/models/word2vec_inner.pyx":714 + /* "gensim/models/word2vec_inner.pyx":713 * c.size = model.wv.vector_size * * c.window = model.window 
# <<<<<<<<<<<<<< * * cdef int i, j, k */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_window); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 714, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_window); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 713, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_3 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 714, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_3 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 713, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_v_c.window = __pyx_t_3; - /* "gensim/models/word2vec_inner.pyx":717 + /* "gensim/models/word2vec_inner.pyx":716 * * cdef int i, j, k * cdef long result = 0 # <<<<<<<<<<<<<< @@ -6654,48 +6708,48 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_result = 0; - /* "gensim/models/word2vec_inner.pyx":720 + /* "gensim/models/word2vec_inner.pyx":719 * cdef int sentence_len * * c.syn1 = (np.PyArray_DATA(model.trainables.syn1)) # <<<<<<<<<<<<<< * * # convert Python structures to primitive types, so we can release the GIL */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_trainables); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 720, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_trainables); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 719, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_syn1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 720, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_syn1); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 719, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 720, __pyx_L1_error) + if 
(!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 719, __pyx_L1_error) __pyx_v_c.syn1 = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_2))); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/word2vec_inner.pyx":723 + /* "gensim/models/word2vec_inner.pyx":722 * * # convert Python structures to primitive types, so we can release the GIL * c.work = np.PyArray_DATA(_work) # <<<<<<<<<<<<<< * * vlookup = model.wv.vocab */ - if (!(likely(((__pyx_v__work) == Py_None) || likely(__Pyx_TypeTest(__pyx_v__work, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 723, __pyx_L1_error) + if (!(likely(((__pyx_v__work) == Py_None) || likely(__Pyx_TypeTest(__pyx_v__work, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 722, __pyx_L1_error) __pyx_v_c.work = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_v__work))); - /* "gensim/models/word2vec_inner.pyx":725 + /* "gensim/models/word2vec_inner.pyx":724 * c.work = np.PyArray_DATA(_work) * * vlookup = model.wv.vocab # <<<<<<<<<<<<<< * i = 0 * for token in sentence: */ - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 725, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 724, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_2, __pyx_n_s_vocab); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 725, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_2, __pyx_n_s_vocab); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 724, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; __pyx_v_vlookup = __pyx_t_1; __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":726 + /* "gensim/models/word2vec_inner.pyx":725 * * vlookup = model.wv.vocab * i = 0 # <<<<<<<<<<<<<< @@ -6704,7 +6758,7 @@ static PyObject 
*__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_i = 0; - /* "gensim/models/word2vec_inner.pyx":727 + /* "gensim/models/word2vec_inner.pyx":726 * vlookup = model.wv.vocab * i = 0 * for token in sentence: # <<<<<<<<<<<<<< @@ -6715,26 +6769,26 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_t_1 = __pyx_v_sentence; __Pyx_INCREF(__pyx_t_1); __pyx_t_4 = 0; __pyx_t_5 = NULL; } else { - __pyx_t_4 = -1; __pyx_t_1 = PyObject_GetIter(__pyx_v_sentence); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 727, __pyx_L1_error) + __pyx_t_4 = -1; __pyx_t_1 = PyObject_GetIter(__pyx_v_sentence); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 726, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_5 = Py_TYPE(__pyx_t_1)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 727, __pyx_L1_error) + __pyx_t_5 = Py_TYPE(__pyx_t_1)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 726, __pyx_L1_error) } for (;;) { if (likely(!__pyx_t_5)) { if (likely(PyList_CheckExact(__pyx_t_1))) { if (__pyx_t_4 >= PyList_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_2 = PyList_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_2); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 727, __pyx_L1_error) + __pyx_t_2 = PyList_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_2); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 726, __pyx_L1_error) #else - __pyx_t_2 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 727, __pyx_L1_error) + __pyx_t_2 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 726, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); #endif } else { if (__pyx_t_4 >= PyTuple_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_2 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_2); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 727, __pyx_L1_error) + 
__pyx_t_2 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_2); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 726, __pyx_L1_error) #else - __pyx_t_2 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 727, __pyx_L1_error) + __pyx_t_2 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 726, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); #endif } @@ -6744,7 +6798,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY PyObject* exc_type = PyErr_Occurred(); if (exc_type) { if (likely(__Pyx_PyErr_GivenExceptionMatches(exc_type, PyExc_StopIteration))) PyErr_Clear(); - else __PYX_ERR(0, 727, __pyx_L1_error) + else __PYX_ERR(0, 726, __pyx_L1_error) } break; } @@ -6753,16 +6807,16 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __Pyx_XDECREF_SET(__pyx_v_token, __pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/word2vec_inner.pyx":728 + /* "gensim/models/word2vec_inner.pyx":727 * i = 0 * for token in sentence: * word = vlookup[token] if token in vlookup else None # <<<<<<<<<<<<<< * if word is None: * continue # should drop the */ - __pyx_t_6 = (__Pyx_PySequence_ContainsTF(__pyx_v_token, __pyx_v_vlookup, Py_EQ)); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(0, 728, __pyx_L1_error) + __pyx_t_6 = (__Pyx_PySequence_ContainsTF(__pyx_v_token, __pyx_v_vlookup, Py_EQ)); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(0, 727, __pyx_L1_error) if ((__pyx_t_6 != 0)) { - __pyx_t_7 = __Pyx_PyObject_GetItem(__pyx_v_vlookup, __pyx_v_token); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 728, __pyx_L1_error) + __pyx_t_7 = __Pyx_PyObject_GetItem(__pyx_v_vlookup, __pyx_v_token); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 727, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); __pyx_t_2 = __pyx_t_7; __pyx_t_7 = 0; @@ -6773,7 +6827,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __Pyx_XDECREF_SET(__pyx_v_word, __pyx_t_2); __pyx_t_2 = 0; - /* 
"gensim/models/word2vec_inner.pyx":729 + /* "gensim/models/word2vec_inner.pyx":728 * for token in sentence: * word = vlookup[token] if token in vlookup else None * if word is None: # <<<<<<<<<<<<<< @@ -6784,7 +6838,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_t_8 = (__pyx_t_6 != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":730 + /* "gensim/models/word2vec_inner.pyx":729 * word = vlookup[token] if token in vlookup else None * if word is None: * continue # should drop the # <<<<<<<<<<<<<< @@ -6793,7 +6847,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ goto __pyx_L3_continue; - /* "gensim/models/word2vec_inner.pyx":729 + /* "gensim/models/word2vec_inner.pyx":728 * for token in sentence: * word = vlookup[token] if token in vlookup else None * if word is None: # <<<<<<<<<<<<<< @@ -6802,59 +6856,59 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ } - /* "gensim/models/word2vec_inner.pyx":731 + /* "gensim/models/word2vec_inner.pyx":730 * if word is None: * continue # should drop the * c.indexes[i] = word.index # <<<<<<<<<<<<<< * c.codelens[i] = len(word.code) * c.codes[i] = np.PyArray_DATA(word.code) */ - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_index); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 731, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_index); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 730, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_9 = __Pyx_PyInt_As_npy_uint32(__pyx_t_2); if (unlikely((__pyx_t_9 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 731, __pyx_L1_error) + __pyx_t_9 = __Pyx_PyInt_As_npy_uint32(__pyx_t_2); if (unlikely((__pyx_t_9 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 730, __pyx_L1_error) __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; (__pyx_v_c.indexes[__pyx_v_i]) = __pyx_t_9; - /* "gensim/models/word2vec_inner.pyx":732 + /* 
"gensim/models/word2vec_inner.pyx":731 * continue # should drop the * c.indexes[i] = word.index * c.codelens[i] = len(word.code) # <<<<<<<<<<<<<< * c.codes[i] = np.PyArray_DATA(word.code) * c.points[i] = np.PyArray_DATA(word.point) */ - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 732, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 731, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - __pyx_t_10 = PyObject_Length(__pyx_t_2); if (unlikely(__pyx_t_10 == ((Py_ssize_t)-1))) __PYX_ERR(0, 732, __pyx_L1_error) + __pyx_t_10 = PyObject_Length(__pyx_t_2); if (unlikely(__pyx_t_10 == ((Py_ssize_t)-1))) __PYX_ERR(0, 731, __pyx_L1_error) __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; (__pyx_v_c.codelens[__pyx_v_i]) = ((int)__pyx_t_10); - /* "gensim/models/word2vec_inner.pyx":733 + /* "gensim/models/word2vec_inner.pyx":732 * c.indexes[i] = word.index * c.codelens[i] = len(word.code) * c.codes[i] = np.PyArray_DATA(word.code) # <<<<<<<<<<<<<< * c.points[i] = np.PyArray_DATA(word.point) * result += 1 */ - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 733, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 732, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 733, __pyx_L1_error) + if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 732, __pyx_L1_error) (__pyx_v_c.codes[__pyx_v_i]) = ((__pyx_t_5numpy_uint8_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_2))); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/word2vec_inner.pyx":734 + /* "gensim/models/word2vec_inner.pyx":733 * c.codelens[i] = len(word.code) * c.codes[i] = 
np.PyArray_DATA(word.code) * c.points[i] = np.PyArray_DATA(word.point) # <<<<<<<<<<<<<< * result += 1 * i += 1 */ - __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_point); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 734, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_point); if (unlikely(!__pyx_t_2)) __PYX_ERR(0, 733, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_2); - if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 734, __pyx_L1_error) + if (!(likely(((__pyx_t_2) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_2, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 733, __pyx_L1_error) (__pyx_v_c.points[__pyx_v_i]) = ((__pyx_t_5numpy_uint32_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_2))); __Pyx_DECREF(__pyx_t_2); __pyx_t_2 = 0; - /* "gensim/models/word2vec_inner.pyx":735 + /* "gensim/models/word2vec_inner.pyx":734 * c.codes[i] = np.PyArray_DATA(word.code) * c.points[i] = np.PyArray_DATA(word.point) * result += 1 # <<<<<<<<<<<<<< @@ -6863,7 +6917,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_result = (__pyx_v_result + 1); - /* "gensim/models/word2vec_inner.pyx":736 + /* "gensim/models/word2vec_inner.pyx":735 * c.points[i] = np.PyArray_DATA(word.point) * result += 1 * i += 1 # <<<<<<<<<<<<<< @@ -6872,7 +6926,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_i = (__pyx_v_i + 1); - /* "gensim/models/word2vec_inner.pyx":737 + /* "gensim/models/word2vec_inner.pyx":736 * result += 1 * i += 1 * if i == MAX_SENTENCE_LEN: # <<<<<<<<<<<<<< @@ -6882,7 +6936,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_t_8 = ((__pyx_v_i == 0x2710) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":738 + /* "gensim/models/word2vec_inner.pyx":737 * i += 1 * if i == MAX_SENTENCE_LEN: * break # TODO: log warning, tally overflow? 
# <<<<<<<<<<<<<< @@ -6891,7 +6945,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ goto __pyx_L4_break; - /* "gensim/models/word2vec_inner.pyx":737 + /* "gensim/models/word2vec_inner.pyx":736 * result += 1 * i += 1 * if i == MAX_SENTENCE_LEN: # <<<<<<<<<<<<<< @@ -6900,7 +6954,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ } - /* "gensim/models/word2vec_inner.pyx":727 + /* "gensim/models/word2vec_inner.pyx":726 * vlookup = model.wv.vocab * i = 0 * for token in sentence: # <<<<<<<<<<<<<< @@ -6912,7 +6966,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_L4_break:; __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":739 + /* "gensim/models/word2vec_inner.pyx":738 * if i == MAX_SENTENCE_LEN: * break # TODO: log warning, tally overflow? * sentence_len = i # <<<<<<<<<<<<<< @@ -6921,7 +6975,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_sentence_len = __pyx_v_i; - /* "gensim/models/word2vec_inner.pyx":742 + /* "gensim/models/word2vec_inner.pyx":741 * * # release GIL & train on the sentence * c.work[0] = 0.0 # <<<<<<<<<<<<<< @@ -6930,7 +6984,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ (__pyx_v_c.work[0]) = 0.0; - /* "gensim/models/word2vec_inner.pyx":744 + /* "gensim/models/word2vec_inner.pyx":743 * c.work[0] = 0.0 * * with nogil: # <<<<<<<<<<<<<< @@ -6945,7 +6999,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY #endif /*try:*/ { - /* "gensim/models/word2vec_inner.pyx":745 + /* "gensim/models/word2vec_inner.pyx":744 * * with nogil: * for i in range(sentence_len): # <<<<<<<<<<<<<< @@ -6957,7 +7011,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY for (__pyx_t_12 = 0; __pyx_t_12 < __pyx_t_11; __pyx_t_12+=1) { __pyx_v_i = __pyx_t_12; - /* 
"gensim/models/word2vec_inner.pyx":746 + /* "gensim/models/word2vec_inner.pyx":745 * with nogil: * for i in range(sentence_len): * if c.codelens[i] == 0: # <<<<<<<<<<<<<< @@ -6967,7 +7021,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_t_8 = (((__pyx_v_c.codelens[__pyx_v_i]) == 0) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":747 + /* "gensim/models/word2vec_inner.pyx":746 * for i in range(sentence_len): * if c.codelens[i] == 0: * continue # <<<<<<<<<<<<<< @@ -6976,7 +7030,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ goto __pyx_L10_continue; - /* "gensim/models/word2vec_inner.pyx":746 + /* "gensim/models/word2vec_inner.pyx":745 * with nogil: * for i in range(sentence_len): * if c.codelens[i] == 0: # <<<<<<<<<<<<<< @@ -6985,7 +7039,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ } - /* "gensim/models/word2vec_inner.pyx":748 + /* "gensim/models/word2vec_inner.pyx":747 * if c.codelens[i] == 0: * continue * j = i - c.window # <<<<<<<<<<<<<< @@ -6994,7 +7048,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_j = (__pyx_v_i - __pyx_v_c.window); - /* "gensim/models/word2vec_inner.pyx":749 + /* "gensim/models/word2vec_inner.pyx":748 * continue * j = i - c.window * if j < 0: # <<<<<<<<<<<<<< @@ -7004,7 +7058,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_t_8 = ((__pyx_v_j < 0) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":750 + /* "gensim/models/word2vec_inner.pyx":749 * j = i - c.window * if j < 0: * j = 0 # <<<<<<<<<<<<<< @@ -7013,7 +7067,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_j = 0; - /* "gensim/models/word2vec_inner.pyx":749 + /* "gensim/models/word2vec_inner.pyx":748 * continue * j = i - c.window * if j < 0: # <<<<<<<<<<<<<< @@ -7022,7 +7076,7 @@ static 
PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ } - /* "gensim/models/word2vec_inner.pyx":751 + /* "gensim/models/word2vec_inner.pyx":750 * if j < 0: * j = 0 * k = i + c.window + 1 # <<<<<<<<<<<<<< @@ -7031,7 +7085,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_k = ((__pyx_v_i + __pyx_v_c.window) + 1); - /* "gensim/models/word2vec_inner.pyx":752 + /* "gensim/models/word2vec_inner.pyx":751 * j = 0 * k = i + c.window + 1 * if k > sentence_len: # <<<<<<<<<<<<<< @@ -7041,7 +7095,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_t_8 = ((__pyx_v_k > __pyx_v_sentence_len) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":753 + /* "gensim/models/word2vec_inner.pyx":752 * k = i + c.window + 1 * if k > sentence_len: * k = sentence_len # <<<<<<<<<<<<<< @@ -7050,7 +7104,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ __pyx_v_k = __pyx_v_sentence_len; - /* "gensim/models/word2vec_inner.pyx":752 + /* "gensim/models/word2vec_inner.pyx":751 * j = 0 * k = i + c.window + 1 * if k > sentence_len: # <<<<<<<<<<<<<< @@ -7059,7 +7113,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ } - /* "gensim/models/word2vec_inner.pyx":754 + /* "gensim/models/word2vec_inner.pyx":753 * if k > sentence_len: * k = sentence_len * for j in range(j, k): # <<<<<<<<<<<<<< @@ -7071,7 +7125,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY for (__pyx_t_15 = __pyx_v_j; __pyx_t_15 < __pyx_t_14; __pyx_t_15+=1) { __pyx_v_j = __pyx_t_15; - /* "gensim/models/word2vec_inner.pyx":755 + /* "gensim/models/word2vec_inner.pyx":754 * k = sentence_len * for j in range(j, k): * if j == i or c.codelens[j] == 0: # <<<<<<<<<<<<<< @@ -7089,7 +7143,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY __pyx_L18_bool_binop_done:; if (__pyx_t_8) { - /* 
"gensim/models/word2vec_inner.pyx":756 + /* "gensim/models/word2vec_inner.pyx":755 * for j in range(j, k): * if j == i or c.codelens[j] == 0: * continue # <<<<<<<<<<<<<< @@ -7098,7 +7152,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ goto __pyx_L15_continue; - /* "gensim/models/word2vec_inner.pyx":755 + /* "gensim/models/word2vec_inner.pyx":754 * k = sentence_len * for j in range(j, k): * if j == i or c.codelens[j] == 0: # <<<<<<<<<<<<<< @@ -7107,7 +7161,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY */ } - /* "gensim/models/word2vec_inner.pyx":757 + /* "gensim/models/word2vec_inner.pyx":756 * if j == i or c.codelens[j] == 0: * continue * score_pair_sg_hs(c.points[i], c.codes[i], c.codelens[i], c.syn0, c.syn1, c.size, c.indexes[j], c.work) # <<<<<<<<<<<<<< @@ -7121,7 +7175,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY } } - /* "gensim/models/word2vec_inner.pyx":744 + /* "gensim/models/word2vec_inner.pyx":743 * c.work[0] = 0.0 * * with nogil: # <<<<<<<<<<<<<< @@ -7140,7 +7194,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY } } - /* "gensim/models/word2vec_inner.pyx":759 + /* "gensim/models/word2vec_inner.pyx":758 * score_pair_sg_hs(c.points[i], c.codes[i], c.codelens[i], c.syn0, c.syn1, c.size, c.indexes[j], c.work) * * return c.work[0] # <<<<<<<<<<<<<< @@ -7148,13 +7202,13 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY * cdef void score_pair_sg_hs( */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyFloat_FromDouble((__pyx_v_c.work[0])); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 759, __pyx_L1_error) + __pyx_t_1 = PyFloat_FromDouble((__pyx_v_c.work[0])); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 758, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "gensim/models/word2vec_inner.pyx":687 + /* "gensim/models/word2vec_inner.pyx":686 * * * def 
score_sentence_sg(model, sentence, _work): # <<<<<<<<<<<<<< @@ -7178,7 +7232,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_4score_sentence_sg(CY return __pyx_r; } -/* "gensim/models/word2vec_inner.pyx":761 +/* "gensim/models/word2vec_inner.pyx":760 * return c.work[0] * * cdef void score_pair_sg_hs( # <<<<<<<<<<<<<< @@ -7199,7 +7253,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n int __pyx_t_5; long __pyx_t_6; - /* "gensim/models/word2vec_inner.pyx":767 + /* "gensim/models/word2vec_inner.pyx":766 * * cdef long long b * cdef long long row1 = word2_index * size, row2, sgn # <<<<<<<<<<<<<< @@ -7208,7 +7262,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ __pyx_v_row1 = (__pyx_v_word2_index * __pyx_v_size); - /* "gensim/models/word2vec_inner.pyx":770 + /* "gensim/models/word2vec_inner.pyx":769 * cdef REAL_t f * * for b in range(codelen): # <<<<<<<<<<<<<< @@ -7220,7 +7274,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n for (__pyx_t_3 = 0; __pyx_t_3 < __pyx_t_2; __pyx_t_3+=1) { __pyx_v_b = __pyx_t_3; - /* "gensim/models/word2vec_inner.pyx":771 + /* "gensim/models/word2vec_inner.pyx":770 * * for b in range(codelen): * row2 = word_point[b] * size # <<<<<<<<<<<<<< @@ -7229,7 +7283,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ __pyx_v_row2 = ((__pyx_v_word_point[__pyx_v_b]) * __pyx_v_size); - /* "gensim/models/word2vec_inner.pyx":772 + /* "gensim/models/word2vec_inner.pyx":771 * for b in range(codelen): * row2 = word_point[b] * size * f = our_dot(&size, &syn0[row1], &ONE, &syn1[row2], &ONE) # <<<<<<<<<<<<<< @@ -7238,7 +7292,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ __pyx_v_f = __pyx_v_6gensim_6models_14word2vec_inner_our_dot((&__pyx_v_size), (&(__pyx_v_syn0[__pyx_v_row1])), (&__pyx_v_6gensim_6models_14word2vec_inner_ONE), (&(__pyx_v_syn1[__pyx_v_row2])), 
(&__pyx_v_6gensim_6models_14word2vec_inner_ONE)); - /* "gensim/models/word2vec_inner.pyx":773 + /* "gensim/models/word2vec_inner.pyx":772 * row2 = word_point[b] * size * f = our_dot(&size, &syn0[row1], &ONE, &syn1[row2], &ONE) * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 # <<<<<<<<<<<<<< @@ -7247,7 +7301,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ __pyx_v_sgn = __Pyx_pow_long(-1L, ((long)(__pyx_v_word_code[__pyx_v_b]))); - /* "gensim/models/word2vec_inner.pyx":774 + /* "gensim/models/word2vec_inner.pyx":773 * f = our_dot(&size, &syn0[row1], &ONE, &syn1[row2], &ONE) * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 * f *= sgn # <<<<<<<<<<<<<< @@ -7256,7 +7310,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ __pyx_v_f = (__pyx_v_f * __pyx_v_sgn); - /* "gensim/models/word2vec_inner.pyx":775 + /* "gensim/models/word2vec_inner.pyx":774 * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 * f *= sgn * if f <= -MAX_EXP or f >= MAX_EXP: # <<<<<<<<<<<<<< @@ -7274,7 +7328,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n __pyx_L6_bool_binop_done:; if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":776 + /* "gensim/models/word2vec_inner.pyx":775 * f *= sgn * if f <= -MAX_EXP or f >= MAX_EXP: * continue # <<<<<<<<<<<<<< @@ -7283,7 +7337,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ goto __pyx_L3_continue; - /* "gensim/models/word2vec_inner.pyx":775 + /* "gensim/models/word2vec_inner.pyx":774 * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 * f *= sgn * if f <= -MAX_EXP or f >= MAX_EXP: # <<<<<<<<<<<<<< @@ -7292,7 +7346,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ } - /* "gensim/models/word2vec_inner.pyx":777 + /* "gensim/models/word2vec_inner.pyx":776 * if f <= -MAX_EXP or f >= MAX_EXP: * continue * f = LOG_TABLE[((f + MAX_EXP) * 
(EXP_TABLE_SIZE / MAX_EXP / 2))] # <<<<<<<<<<<<<< @@ -7301,7 +7355,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n */ __pyx_v_f = (__pyx_v_6gensim_6models_14word2vec_inner_LOG_TABLE[((int)((__pyx_v_f + 6.0) * 83.0))]); - /* "gensim/models/word2vec_inner.pyx":778 + /* "gensim/models/word2vec_inner.pyx":777 * continue * f = LOG_TABLE[((f + MAX_EXP) * (EXP_TABLE_SIZE / MAX_EXP / 2))] * work[0] += f # <<<<<<<<<<<<<< @@ -7313,7 +7367,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n __pyx_L3_continue:; } - /* "gensim/models/word2vec_inner.pyx":761 + /* "gensim/models/word2vec_inner.pyx":760 * return c.work[0] * * cdef void score_pair_sg_hs( # <<<<<<<<<<<<<< @@ -7324,7 +7378,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n /* function exit code */ } -/* "gensim/models/word2vec_inner.pyx":780 +/* "gensim/models/word2vec_inner.pyx":779 * work[0] += f * * def score_sentence_cbow(model, sentence, _work, _neu1): # <<<<<<<<<<<<<< @@ -7335,7 +7389,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_sg_hs(__pyx_t_5n /* Python wrapper */ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_7score_sentence_cbow(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds); /*proto*/ static char __pyx_doc_6gensim_6models_14word2vec_inner_6score_sentence_cbow[] = "score_sentence_cbow(model, sentence, _work, _neu1)\nObtain likelihood score for a single sentence in a fitted CBOW representation.\n\n Notes\n -----\n This scoring function is only implemented for hierarchical softmax (`model.hs == 1`).\n The model should have been trained using the skip-gram model (`model.cbow` == 1`).\n\n Parameters\n ----------\n model : :class:`~gensim.models.word2vec.Word2Vec`\n The trained model. 
It **MUST** have been trained using hierarchical softmax and the CBOW algorithm.\n sentence : list of str\n The words comprising the sentence to be scored.\n _work : np.ndarray\n Private working memory for each worker.\n _neu1 : np.ndarray\n Private working memory for each worker.\n\n Returns\n -------\n float\n The probability assigned to this sentence by the Skip-Gram model.\n\n "; -static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_7score_sentence_cbow = {"score_sentence_cbow", (PyCFunction)__pyx_pw_6gensim_6models_14word2vec_inner_7score_sentence_cbow, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_6score_sentence_cbow}; +static PyMethodDef __pyx_mdef_6gensim_6models_14word2vec_inner_7score_sentence_cbow = {"score_sentence_cbow", (PyCFunction)(void*)(PyCFunctionWithKeywords)__pyx_pw_6gensim_6models_14word2vec_inner_7score_sentence_cbow, METH_VARARGS|METH_KEYWORDS, __pyx_doc_6gensim_6models_14word2vec_inner_6score_sentence_cbow}; static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_7score_sentence_cbow(PyObject *__pyx_self, PyObject *__pyx_args, PyObject *__pyx_kwds) { PyObject *__pyx_v_model = 0; PyObject *__pyx_v_sentence = 0; @@ -7371,23 +7425,23 @@ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_7score_sentence_cbow( case 1: if (likely((values[1] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_sentence)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, 1); __PYX_ERR(0, 780, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, 1); __PYX_ERR(0, 779, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 2: if (likely((values[2] = __Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_work)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, 2); __PYX_ERR(0, 780, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, 2); __PYX_ERR(0, 779, __pyx_L3_error) } CYTHON_FALLTHROUGH; case 3: if (likely((values[3] = 
__Pyx_PyDict_GetItemStr(__pyx_kwds, __pyx_n_s_neu1)) != 0)) kw_args--; else { - __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, 3); __PYX_ERR(0, 780, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, 3); __PYX_ERR(0, 779, __pyx_L3_error) } } if (unlikely(kw_args > 0)) { - if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "score_sentence_cbow") < 0)) __PYX_ERR(0, 780, __pyx_L3_error) + if (unlikely(__Pyx_ParseOptionalKeywords(__pyx_kwds, __pyx_pyargnames, 0, values, pos_args, "score_sentence_cbow") < 0)) __PYX_ERR(0, 779, __pyx_L3_error) } } else if (PyTuple_GET_SIZE(__pyx_args) != 4) { goto __pyx_L5_argtuple_error; @@ -7404,7 +7458,7 @@ static PyObject *__pyx_pw_6gensim_6models_14word2vec_inner_7score_sentence_cbow( } goto __pyx_L4_argument_unpacking_done; __pyx_L5_argtuple_error:; - __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 780, __pyx_L3_error) + __Pyx_RaiseArgtupleInvalid("score_sentence_cbow", 1, 4, 4, PyTuple_GET_SIZE(__pyx_args)); __PYX_ERR(0, 779, __pyx_L3_error) __pyx_L3_error:; __Pyx_AddTraceback("gensim.models.word2vec_inner.score_sentence_cbow", __pyx_clineno, __pyx_lineno, __pyx_filename); __Pyx_RefNannyFinishContext(); @@ -7443,65 +7497,65 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( int __pyx_t_12; __Pyx_RefNannySetupContext("score_sentence_cbow", 0); - /* "gensim/models/word2vec_inner.pyx":807 + /* "gensim/models/word2vec_inner.pyx":806 * cdef Word2VecConfig c * * c.cbow_mean = model.cbow_mean # <<<<<<<<<<<<<< * c.syn0 = (np.PyArray_DATA(model.wv.vectors)) * c.size = model.wv.vector_size */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_cbow_mean); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 807, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_cbow_mean); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 806, __pyx_L1_error) 
__Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 807, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 806, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_v_c.cbow_mean = __pyx_t_2; - /* "gensim/models/word2vec_inner.pyx":808 + /* "gensim/models/word2vec_inner.pyx":807 * * c.cbow_mean = model.cbow_mean * c.syn0 = (np.PyArray_DATA(model.wv.vectors)) # <<<<<<<<<<<<<< * c.size = model.wv.vector_size * c.window = model.window */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 808, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 807, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_vectors); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 808, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_vectors); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 807, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 808, __pyx_L1_error) + if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 807, __pyx_L1_error) __pyx_v_c.syn0 = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_3))); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":809 + /* "gensim/models/word2vec_inner.pyx":808 * c.cbow_mean = model.cbow_mean * c.syn0 = (np.PyArray_DATA(model.wv.vectors)) * c.size = model.wv.vector_size # <<<<<<<<<<<<<< * c.window = model.window * */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if 
(unlikely(!__pyx_t_3)) __PYX_ERR(0, 809, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 808, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_3, __pyx_n_s_vector_size); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 809, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_3, __pyx_n_s_vector_size); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 808, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 809, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 808, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_v_c.size = __pyx_t_2; - /* "gensim/models/word2vec_inner.pyx":810 + /* "gensim/models/word2vec_inner.pyx":809 * c.syn0 = (np.PyArray_DATA(model.wv.vectors)) * c.size = model.wv.vector_size * c.window = model.window # <<<<<<<<<<<<<< * * cdef int i, j, k */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_window); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 810, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_window); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 809, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 810, __pyx_L1_error) + __pyx_t_2 = __Pyx_PyInt_As_int(__pyx_t_1); if (unlikely((__pyx_t_2 == (int)-1) && PyErr_Occurred())) __PYX_ERR(0, 809, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __pyx_v_c.window = __pyx_t_2; - /* "gensim/models/word2vec_inner.pyx":813 + /* "gensim/models/word2vec_inner.pyx":812 * * cdef int i, j, k * cdef long result = 0 # <<<<<<<<<<<<<< @@ -7510,58 +7564,58 @@ static PyObject 
*__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_result = 0; - /* "gensim/models/word2vec_inner.pyx":815 + /* "gensim/models/word2vec_inner.pyx":814 * cdef long result = 0 * * c.syn1 = (np.PyArray_DATA(model.trainables.syn1)) # <<<<<<<<<<<<<< * * # convert Python structures to primitive types, so we can release the GIL */ - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_trainables); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 815, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_trainables); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 814, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_syn1); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 815, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_syn1); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 814, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 815, __pyx_L1_error) + if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 814, __pyx_L1_error) __pyx_v_c.syn1 = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_3))); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":818 + /* "gensim/models/word2vec_inner.pyx":817 * * # convert Python structures to primitive types, so we can release the GIL * c.work = np.PyArray_DATA(_work) # <<<<<<<<<<<<<< * c.neu1 = np.PyArray_DATA(_neu1) * */ - if (!(likely(((__pyx_v__work) == Py_None) || likely(__Pyx_TypeTest(__pyx_v__work, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 818, __pyx_L1_error) + if (!(likely(((__pyx_v__work) == Py_None) || likely(__Pyx_TypeTest(__pyx_v__work, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 817, __pyx_L1_error) __pyx_v_c.work = 
((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_v__work))); - /* "gensim/models/word2vec_inner.pyx":819 + /* "gensim/models/word2vec_inner.pyx":818 * # convert Python structures to primitive types, so we can release the GIL * c.work = np.PyArray_DATA(_work) * c.neu1 = np.PyArray_DATA(_neu1) # <<<<<<<<<<<<<< * * vlookup = model.wv.vocab */ - if (!(likely(((__pyx_v__neu1) == Py_None) || likely(__Pyx_TypeTest(__pyx_v__neu1, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 819, __pyx_L1_error) + if (!(likely(((__pyx_v__neu1) == Py_None) || likely(__Pyx_TypeTest(__pyx_v__neu1, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 818, __pyx_L1_error) __pyx_v_c.neu1 = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t *)PyArray_DATA(((PyArrayObject *)__pyx_v__neu1))); - /* "gensim/models/word2vec_inner.pyx":821 + /* "gensim/models/word2vec_inner.pyx":820 * c.neu1 = np.PyArray_DATA(_neu1) * * vlookup = model.wv.vocab # <<<<<<<<<<<<<< * i = 0 * for token in sentence: */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 821, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_model, __pyx_n_s_wv); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 820, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_3, __pyx_n_s_vocab); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 821, __pyx_L1_error) + __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_3, __pyx_n_s_vocab); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 820, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __pyx_v_vlookup = __pyx_t_1; __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":822 + /* "gensim/models/word2vec_inner.pyx":821 * * vlookup = model.wv.vocab * i = 0 # <<<<<<<<<<<<<< @@ -7570,7 +7624,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_i = 0; - /* "gensim/models/word2vec_inner.pyx":823 + /* 
"gensim/models/word2vec_inner.pyx":822 * vlookup = model.wv.vocab * i = 0 * for token in sentence: # <<<<<<<<<<<<<< @@ -7581,26 +7635,26 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_t_1 = __pyx_v_sentence; __Pyx_INCREF(__pyx_t_1); __pyx_t_4 = 0; __pyx_t_5 = NULL; } else { - __pyx_t_4 = -1; __pyx_t_1 = PyObject_GetIter(__pyx_v_sentence); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 823, __pyx_L1_error) + __pyx_t_4 = -1; __pyx_t_1 = PyObject_GetIter(__pyx_v_sentence); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 822, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_5 = Py_TYPE(__pyx_t_1)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 823, __pyx_L1_error) + __pyx_t_5 = Py_TYPE(__pyx_t_1)->tp_iternext; if (unlikely(!__pyx_t_5)) __PYX_ERR(0, 822, __pyx_L1_error) } for (;;) { if (likely(!__pyx_t_5)) { if (likely(PyList_CheckExact(__pyx_t_1))) { if (__pyx_t_4 >= PyList_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_3 = PyList_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 823, __pyx_L1_error) + __pyx_t_3 = PyList_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 822, __pyx_L1_error) #else - __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 823, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 822, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); #endif } else { if (__pyx_t_4 >= PyTuple_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 823, __pyx_L1_error) + __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_4); __Pyx_INCREF(__pyx_t_3); __pyx_t_4++; if (unlikely(0 < 0)) __PYX_ERR(0, 822, 
__pyx_L1_error) #else - __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 823, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_4); __pyx_t_4++; if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 822, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); #endif } @@ -7610,7 +7664,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( PyObject* exc_type = PyErr_Occurred(); if (exc_type) { if (likely(__Pyx_PyErr_GivenExceptionMatches(exc_type, PyExc_StopIteration))) PyErr_Clear(); - else __PYX_ERR(0, 823, __pyx_L1_error) + else __PYX_ERR(0, 822, __pyx_L1_error) } break; } @@ -7619,16 +7673,16 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __Pyx_XDECREF_SET(__pyx_v_token, __pyx_t_3); __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":824 + /* "gensim/models/word2vec_inner.pyx":823 * i = 0 * for token in sentence: * word = vlookup[token] if token in vlookup else None # <<<<<<<<<<<<<< * if word is None: * continue # for score, should this be a default negative value? 
*/ - __pyx_t_6 = (__Pyx_PySequence_ContainsTF(__pyx_v_token, __pyx_v_vlookup, Py_EQ)); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(0, 824, __pyx_L1_error) + __pyx_t_6 = (__Pyx_PySequence_ContainsTF(__pyx_v_token, __pyx_v_vlookup, Py_EQ)); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(0, 823, __pyx_L1_error) if ((__pyx_t_6 != 0)) { - __pyx_t_7 = __Pyx_PyObject_GetItem(__pyx_v_vlookup, __pyx_v_token); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 824, __pyx_L1_error) + __pyx_t_7 = __Pyx_PyObject_GetItem(__pyx_v_vlookup, __pyx_v_token); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 823, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); __pyx_t_3 = __pyx_t_7; __pyx_t_7 = 0; @@ -7639,7 +7693,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __Pyx_XDECREF_SET(__pyx_v_word, __pyx_t_3); __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":825 + /* "gensim/models/word2vec_inner.pyx":824 * for token in sentence: * word = vlookup[token] if token in vlookup else None * if word is None: # <<<<<<<<<<<<<< @@ -7650,7 +7704,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_t_8 = (__pyx_t_6 != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":826 + /* "gensim/models/word2vec_inner.pyx":825 * word = vlookup[token] if token in vlookup else None * if word is None: * continue # for score, should this be a default negative value? 
# <<<<<<<<<<<<<< @@ -7659,7 +7713,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ goto __pyx_L3_continue; - /* "gensim/models/word2vec_inner.pyx":825 + /* "gensim/models/word2vec_inner.pyx":824 * for token in sentence: * word = vlookup[token] if token in vlookup else None * if word is None: # <<<<<<<<<<<<<< @@ -7668,59 +7722,59 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ } - /* "gensim/models/word2vec_inner.pyx":827 + /* "gensim/models/word2vec_inner.pyx":826 * if word is None: * continue # for score, should this be a default negative value? * c.indexes[i] = word.index # <<<<<<<<<<<<<< * c.codelens[i] = len(word.code) * c.codes[i] = np.PyArray_DATA(word.code) */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_index); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 827, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_index); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 826, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_9 = __Pyx_PyInt_As_npy_uint32(__pyx_t_3); if (unlikely((__pyx_t_9 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 827, __pyx_L1_error) + __pyx_t_9 = __Pyx_PyInt_As_npy_uint32(__pyx_t_3); if (unlikely((__pyx_t_9 == ((npy_uint32)-1)) && PyErr_Occurred())) __PYX_ERR(0, 826, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; (__pyx_v_c.indexes[__pyx_v_i]) = __pyx_t_9; - /* "gensim/models/word2vec_inner.pyx":828 + /* "gensim/models/word2vec_inner.pyx":827 * continue # for score, should this be a default negative value? 
* c.indexes[i] = word.index * c.codelens[i] = len(word.code) # <<<<<<<<<<<<<< * c.codes[i] = np.PyArray_DATA(word.code) * c.points[i] = np.PyArray_DATA(word.point) */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 828, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 827, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_10 = PyObject_Length(__pyx_t_3); if (unlikely(__pyx_t_10 == ((Py_ssize_t)-1))) __PYX_ERR(0, 828, __pyx_L1_error) + __pyx_t_10 = PyObject_Length(__pyx_t_3); if (unlikely(__pyx_t_10 == ((Py_ssize_t)-1))) __PYX_ERR(0, 827, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; (__pyx_v_c.codelens[__pyx_v_i]) = ((int)__pyx_t_10); - /* "gensim/models/word2vec_inner.pyx":829 + /* "gensim/models/word2vec_inner.pyx":828 * c.indexes[i] = word.index * c.codelens[i] = len(word.code) * c.codes[i] = np.PyArray_DATA(word.code) # <<<<<<<<<<<<<< * c.points[i] = np.PyArray_DATA(word.point) * result += 1 */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 829, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_code); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 828, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 829, __pyx_L1_error) + if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 828, __pyx_L1_error) (__pyx_v_c.codes[__pyx_v_i]) = ((__pyx_t_5numpy_uint8_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_3))); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":830 + /* "gensim/models/word2vec_inner.pyx":829 * c.codelens[i] = len(word.code) * c.codes[i] = np.PyArray_DATA(word.code) * c.points[i] = np.PyArray_DATA(word.point) # <<<<<<<<<<<<<< 
* result += 1 * i += 1 */ - __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_point); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 830, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_GetAttrStr(__pyx_v_word, __pyx_n_s_point); if (unlikely(!__pyx_t_3)) __PYX_ERR(0, 829, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 830, __pyx_L1_error) + if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_ndarray))))) __PYX_ERR(0, 829, __pyx_L1_error) (__pyx_v_c.points[__pyx_v_i]) = ((__pyx_t_5numpy_uint32_t *)PyArray_DATA(((PyArrayObject *)__pyx_t_3))); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - /* "gensim/models/word2vec_inner.pyx":831 + /* "gensim/models/word2vec_inner.pyx":830 * c.codes[i] = np.PyArray_DATA(word.code) * c.points[i] = np.PyArray_DATA(word.point) * result += 1 # <<<<<<<<<<<<<< @@ -7729,7 +7783,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_result = (__pyx_v_result + 1); - /* "gensim/models/word2vec_inner.pyx":832 + /* "gensim/models/word2vec_inner.pyx":831 * c.points[i] = np.PyArray_DATA(word.point) * result += 1 * i += 1 # <<<<<<<<<<<<<< @@ -7738,7 +7792,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_i = (__pyx_v_i + 1); - /* "gensim/models/word2vec_inner.pyx":833 + /* "gensim/models/word2vec_inner.pyx":832 * result += 1 * i += 1 * if i == MAX_SENTENCE_LEN: # <<<<<<<<<<<<<< @@ -7748,7 +7802,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_t_8 = ((__pyx_v_i == 0x2710) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":834 + /* "gensim/models/word2vec_inner.pyx":833 * i += 1 * if i == MAX_SENTENCE_LEN: * break # TODO: log warning, tally overflow? 
# <<<<<<<<<<<<<< @@ -7757,7 +7811,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ goto __pyx_L4_break; - /* "gensim/models/word2vec_inner.pyx":833 + /* "gensim/models/word2vec_inner.pyx":832 * result += 1 * i += 1 * if i == MAX_SENTENCE_LEN: # <<<<<<<<<<<<<< @@ -7766,7 +7820,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ } - /* "gensim/models/word2vec_inner.pyx":823 + /* "gensim/models/word2vec_inner.pyx":822 * vlookup = model.wv.vocab * i = 0 * for token in sentence: # <<<<<<<<<<<<<< @@ -7778,7 +7832,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_L4_break:; __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":835 + /* "gensim/models/word2vec_inner.pyx":834 * if i == MAX_SENTENCE_LEN: * break # TODO: log warning, tally overflow? * sentence_len = i # <<<<<<<<<<<<<< @@ -7787,7 +7841,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_sentence_len = __pyx_v_i; - /* "gensim/models/word2vec_inner.pyx":838 + /* "gensim/models/word2vec_inner.pyx":837 * * # release GIL & train on the sentence * c.work[0] = 0.0 # <<<<<<<<<<<<<< @@ -7796,7 +7850,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ (__pyx_v_c.work[0]) = 0.0; - /* "gensim/models/word2vec_inner.pyx":839 + /* "gensim/models/word2vec_inner.pyx":838 * # release GIL & train on the sentence * c.work[0] = 0.0 * with nogil: # <<<<<<<<<<<<<< @@ -7811,7 +7865,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( #endif /*try:*/ { - /* "gensim/models/word2vec_inner.pyx":840 + /* "gensim/models/word2vec_inner.pyx":839 * c.work[0] = 0.0 * with nogil: * for i in range(sentence_len): # <<<<<<<<<<<<<< @@ -7823,7 +7877,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( for (__pyx_t_12 = 0; __pyx_t_12 < __pyx_t_11; __pyx_t_12+=1) 
{ __pyx_v_i = __pyx_t_12; - /* "gensim/models/word2vec_inner.pyx":841 + /* "gensim/models/word2vec_inner.pyx":840 * with nogil: * for i in range(sentence_len): * if c.codelens[i] == 0: # <<<<<<<<<<<<<< @@ -7833,7 +7887,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_t_8 = (((__pyx_v_c.codelens[__pyx_v_i]) == 0) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":842 + /* "gensim/models/word2vec_inner.pyx":841 * for i in range(sentence_len): * if c.codelens[i] == 0: * continue # <<<<<<<<<<<<<< @@ -7842,7 +7896,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ goto __pyx_L10_continue; - /* "gensim/models/word2vec_inner.pyx":841 + /* "gensim/models/word2vec_inner.pyx":840 * with nogil: * for i in range(sentence_len): * if c.codelens[i] == 0: # <<<<<<<<<<<<<< @@ -7851,7 +7905,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ } - /* "gensim/models/word2vec_inner.pyx":843 + /* "gensim/models/word2vec_inner.pyx":842 * if c.codelens[i] == 0: * continue * j = i - c.window # <<<<<<<<<<<<<< @@ -7860,7 +7914,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_j = (__pyx_v_i - __pyx_v_c.window); - /* "gensim/models/word2vec_inner.pyx":844 + /* "gensim/models/word2vec_inner.pyx":843 * continue * j = i - c.window * if j < 0: # <<<<<<<<<<<<<< @@ -7870,7 +7924,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_t_8 = ((__pyx_v_j < 0) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":845 + /* "gensim/models/word2vec_inner.pyx":844 * j = i - c.window * if j < 0: * j = 0 # <<<<<<<<<<<<<< @@ -7879,7 +7933,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_j = 0; - /* "gensim/models/word2vec_inner.pyx":844 + /* "gensim/models/word2vec_inner.pyx":843 * continue * j = i - c.window * if j < 0: # <<<<<<<<<<<<<< @@ 
-7888,7 +7942,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ } - /* "gensim/models/word2vec_inner.pyx":846 + /* "gensim/models/word2vec_inner.pyx":845 * if j < 0: * j = 0 * k = i + c.window + 1 # <<<<<<<<<<<<<< @@ -7897,7 +7951,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_k = ((__pyx_v_i + __pyx_v_c.window) + 1); - /* "gensim/models/word2vec_inner.pyx":847 + /* "gensim/models/word2vec_inner.pyx":846 * j = 0 * k = i + c.window + 1 * if k > sentence_len: # <<<<<<<<<<<<<< @@ -7907,7 +7961,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( __pyx_t_8 = ((__pyx_v_k > __pyx_v_sentence_len) != 0); if (__pyx_t_8) { - /* "gensim/models/word2vec_inner.pyx":848 + /* "gensim/models/word2vec_inner.pyx":847 * k = i + c.window + 1 * if k > sentence_len: * k = sentence_len # <<<<<<<<<<<<<< @@ -7916,7 +7970,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ __pyx_v_k = __pyx_v_sentence_len; - /* "gensim/models/word2vec_inner.pyx":847 + /* "gensim/models/word2vec_inner.pyx":846 * j = 0 * k = i + c.window + 1 * if k > sentence_len: # <<<<<<<<<<<<<< @@ -7925,7 +7979,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( */ } - /* "gensim/models/word2vec_inner.pyx":849 + /* "gensim/models/word2vec_inner.pyx":848 * if k > sentence_len: * k = sentence_len * score_pair_cbow_hs(c.points[i], c.codes[i], c.codelens, c.neu1, c.syn0, c.syn1, c.size, c.indexes, c.work, i, j, k, c.cbow_mean) # <<<<<<<<<<<<<< @@ -7937,7 +7991,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( } } - /* "gensim/models/word2vec_inner.pyx":839 + /* "gensim/models/word2vec_inner.pyx":838 * # release GIL & train on the sentence * c.work[0] = 0.0 * with nogil: # <<<<<<<<<<<<<< @@ -7956,7 +8010,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( } } - /* 
"gensim/models/word2vec_inner.pyx":851 + /* "gensim/models/word2vec_inner.pyx":850 * score_pair_cbow_hs(c.points[i], c.codes[i], c.codelens, c.neu1, c.syn0, c.syn1, c.size, c.indexes, c.work, i, j, k, c.cbow_mean) * * return c.work[0] # <<<<<<<<<<<<<< @@ -7964,13 +8018,13 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( * cdef void score_pair_cbow_hs( */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyFloat_FromDouble((__pyx_v_c.work[0])); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 851, __pyx_L1_error) + __pyx_t_1 = PyFloat_FromDouble((__pyx_v_c.work[0])); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 850, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "gensim/models/word2vec_inner.pyx":780 + /* "gensim/models/word2vec_inner.pyx":779 * work[0] += f * * def score_sentence_cbow(model, sentence, _work, _neu1): # <<<<<<<<<<<<<< @@ -7994,7 +8048,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_6score_sentence_cbow( return __pyx_r; } -/* "gensim/models/word2vec_inner.pyx":853 +/* "gensim/models/word2vec_inner.pyx":852 * return c.work[0] * * cdef void score_pair_cbow_hs( # <<<<<<<<<<<<<< @@ -8018,7 +8072,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ PY_LONG_LONG __pyx_t_6; long __pyx_t_7; - /* "gensim/models/word2vec_inner.pyx":864 + /* "gensim/models/word2vec_inner.pyx":863 * cdef int m * * memset(neu1, 0, size * cython.sizeof(REAL_t)) # <<<<<<<<<<<<<< @@ -8027,7 +8081,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ (void)(memset(__pyx_v_neu1, 0, (__pyx_v_size * (sizeof(__pyx_t_6gensim_6models_14word2vec_inner_REAL_t))))); - /* "gensim/models/word2vec_inner.pyx":865 + /* "gensim/models/word2vec_inner.pyx":864 * * memset(neu1, 0, size * cython.sizeof(REAL_t)) * count = 0.0 # <<<<<<<<<<<<<< @@ -8036,7 +8090,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_count = 
((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t)0.0); - /* "gensim/models/word2vec_inner.pyx":866 + /* "gensim/models/word2vec_inner.pyx":865 * memset(neu1, 0, size * cython.sizeof(REAL_t)) * count = 0.0 * for m in range(j, k): # <<<<<<<<<<<<<< @@ -8048,7 +8102,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ for (__pyx_t_3 = __pyx_v_j; __pyx_t_3 < __pyx_t_2; __pyx_t_3+=1) { __pyx_v_m = __pyx_t_3; - /* "gensim/models/word2vec_inner.pyx":867 + /* "gensim/models/word2vec_inner.pyx":866 * count = 0.0 * for m in range(j, k): * if m == i or codelens[m] == 0: # <<<<<<<<<<<<<< @@ -8066,7 +8120,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ __pyx_L6_bool_binop_done:; if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":868 + /* "gensim/models/word2vec_inner.pyx":867 * for m in range(j, k): * if m == i or codelens[m] == 0: * continue # <<<<<<<<<<<<<< @@ -8075,7 +8129,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ goto __pyx_L3_continue; - /* "gensim/models/word2vec_inner.pyx":867 + /* "gensim/models/word2vec_inner.pyx":866 * count = 0.0 * for m in range(j, k): * if m == i or codelens[m] == 0: # <<<<<<<<<<<<<< @@ -8084,7 +8138,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ } - /* "gensim/models/word2vec_inner.pyx":870 + /* "gensim/models/word2vec_inner.pyx":869 * continue * else: * count += ONEF # <<<<<<<<<<<<<< @@ -8094,7 +8148,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ /*else*/ { __pyx_v_count = (__pyx_v_count + __pyx_v_6gensim_6models_14word2vec_inner_ONEF); - /* "gensim/models/word2vec_inner.pyx":871 + /* "gensim/models/word2vec_inner.pyx":870 * else: * count += ONEF * our_saxpy(&size, &ONEF, &syn0[indexes[m] * size], &ONE, neu1, &ONE) # <<<<<<<<<<<<<< @@ -8106,7 +8160,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ 
__pyx_L3_continue:; } - /* "gensim/models/word2vec_inner.pyx":872 + /* "gensim/models/word2vec_inner.pyx":871 * count += ONEF * our_saxpy(&size, &ONEF, &syn0[indexes[m] * size], &ONE, neu1, &ONE) * if count > (0.5): # <<<<<<<<<<<<<< @@ -8116,7 +8170,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ __pyx_t_4 = ((__pyx_v_count > ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t)0.5)) != 0); if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":873 + /* "gensim/models/word2vec_inner.pyx":872 * our_saxpy(&size, &ONEF, &syn0[indexes[m] * size], &ONE, neu1, &ONE) * if count > (0.5): * inv_count = ONEF/count # <<<<<<<<<<<<<< @@ -8125,7 +8179,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_inv_count = (__pyx_v_6gensim_6models_14word2vec_inner_ONEF / __pyx_v_count); - /* "gensim/models/word2vec_inner.pyx":872 + /* "gensim/models/word2vec_inner.pyx":871 * count += ONEF * our_saxpy(&size, &ONEF, &syn0[indexes[m] * size], &ONE, neu1, &ONE) * if count > (0.5): # <<<<<<<<<<<<<< @@ -8134,7 +8188,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ } - /* "gensim/models/word2vec_inner.pyx":874 + /* "gensim/models/word2vec_inner.pyx":873 * if count > (0.5): * inv_count = ONEF/count * if cbow_mean: # <<<<<<<<<<<<<< @@ -8144,7 +8198,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ __pyx_t_4 = (__pyx_v_cbow_mean != 0); if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":875 + /* "gensim/models/word2vec_inner.pyx":874 * inv_count = ONEF/count * if cbow_mean: * sscal(&size, &inv_count, neu1, &ONE) # <<<<<<<<<<<<<< @@ -8153,7 +8207,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_6gensim_6models_14word2vec_inner_sscal((&__pyx_v_size), (&__pyx_v_inv_count), __pyx_v_neu1, (&__pyx_v_6gensim_6models_14word2vec_inner_ONE)); - /* "gensim/models/word2vec_inner.pyx":874 + /* 
"gensim/models/word2vec_inner.pyx":873 * if count > (0.5): * inv_count = ONEF/count * if cbow_mean: # <<<<<<<<<<<<<< @@ -8162,7 +8216,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ } - /* "gensim/models/word2vec_inner.pyx":877 + /* "gensim/models/word2vec_inner.pyx":876 * sscal(&size, &inv_count, neu1, &ONE) * * for b in range(codelens[i]): # <<<<<<<<<<<<<< @@ -8174,7 +8228,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_2; __pyx_t_6+=1) { __pyx_v_b = __pyx_t_6; - /* "gensim/models/word2vec_inner.pyx":878 + /* "gensim/models/word2vec_inner.pyx":877 * * for b in range(codelens[i]): * row2 = word_point[b] * size # <<<<<<<<<<<<<< @@ -8183,7 +8237,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_row2 = ((__pyx_v_word_point[__pyx_v_b]) * __pyx_v_size); - /* "gensim/models/word2vec_inner.pyx":879 + /* "gensim/models/word2vec_inner.pyx":878 * for b in range(codelens[i]): * row2 = word_point[b] * size * f = our_dot(&size, neu1, &ONE, &syn1[row2], &ONE) # <<<<<<<<<<<<<< @@ -8192,7 +8246,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_f = __pyx_v_6gensim_6models_14word2vec_inner_our_dot((&__pyx_v_size), __pyx_v_neu1, (&__pyx_v_6gensim_6models_14word2vec_inner_ONE), (&(__pyx_v_syn1[__pyx_v_row2])), (&__pyx_v_6gensim_6models_14word2vec_inner_ONE)); - /* "gensim/models/word2vec_inner.pyx":880 + /* "gensim/models/word2vec_inner.pyx":879 * row2 = word_point[b] * size * f = our_dot(&size, neu1, &ONE, &syn1[row2], &ONE) * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 # <<<<<<<<<<<<<< @@ -8201,7 +8255,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_sgn = __Pyx_pow_long(-1L, ((long)(__pyx_v_word_code[__pyx_v_b]))); - /* "gensim/models/word2vec_inner.pyx":881 + /* "gensim/models/word2vec_inner.pyx":880 * f = 
our_dot(&size, neu1, &ONE, &syn1[row2], &ONE) * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 * f *= sgn # <<<<<<<<<<<<<< @@ -8210,7 +8264,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_f = (__pyx_v_f * __pyx_v_sgn); - /* "gensim/models/word2vec_inner.pyx":882 + /* "gensim/models/word2vec_inner.pyx":881 * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 * f *= sgn * if f <= -MAX_EXP or f >= MAX_EXP: # <<<<<<<<<<<<<< @@ -8228,7 +8282,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ __pyx_L13_bool_binop_done:; if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":883 + /* "gensim/models/word2vec_inner.pyx":882 * f *= sgn * if f <= -MAX_EXP or f >= MAX_EXP: * continue # <<<<<<<<<<<<<< @@ -8237,7 +8291,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ goto __pyx_L10_continue; - /* "gensim/models/word2vec_inner.pyx":882 + /* "gensim/models/word2vec_inner.pyx":881 * sgn = (-1)**word_code[b] # ch function: 0-> 1, 1 -> -1 * f *= sgn * if f <= -MAX_EXP or f >= MAX_EXP: # <<<<<<<<<<<<<< @@ -8246,7 +8300,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ } - /* "gensim/models/word2vec_inner.pyx":884 + /* "gensim/models/word2vec_inner.pyx":883 * if f <= -MAX_EXP or f >= MAX_EXP: * continue * f = LOG_TABLE[((f + MAX_EXP) * (EXP_TABLE_SIZE / MAX_EXP / 2))] # <<<<<<<<<<<<<< @@ -8255,7 +8309,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ */ __pyx_v_f = (__pyx_v_6gensim_6models_14word2vec_inner_LOG_TABLE[((int)((__pyx_v_f + 6.0) * 83.0))]); - /* "gensim/models/word2vec_inner.pyx":885 + /* "gensim/models/word2vec_inner.pyx":884 * continue * f = LOG_TABLE[((f + MAX_EXP) * (EXP_TABLE_SIZE / MAX_EXP / 2))] * work[0] += f # <<<<<<<<<<<<<< @@ -8267,7 +8321,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ __pyx_L10_continue:; } - /* 
"gensim/models/word2vec_inner.pyx":853 + /* "gensim/models/word2vec_inner.pyx":852 * return c.work[0] * * cdef void score_pair_cbow_hs( # <<<<<<<<<<<<<< @@ -8278,7 +8332,7 @@ static void __pyx_f_6gensim_6models_14word2vec_inner_score_pair_cbow_hs(__pyx_t_ /* function exit code */ } -/* "gensim/models/word2vec_inner.pyx":888 +/* "gensim/models/word2vec_inner.pyx":887 * * * def init(): # <<<<<<<<<<<<<< @@ -8317,7 +8371,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P int __pyx_t_4; __Pyx_RefNannySetupContext("init", 0); - /* "gensim/models/word2vec_inner.pyx":904 + /* "gensim/models/word2vec_inner.pyx":903 * * cdef int i * cdef float *x = [10.0] # <<<<<<<<<<<<<< @@ -8327,7 +8381,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P __pyx_t_1[0] = ((float)10.0); __pyx_v_x = __pyx_t_1; - /* "gensim/models/word2vec_inner.pyx":905 + /* "gensim/models/word2vec_inner.pyx":904 * cdef int i * cdef float *x = [10.0] * cdef float *y = [0.01] # <<<<<<<<<<<<<< @@ -8337,7 +8391,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P __pyx_t_2[0] = ((float)0.01); __pyx_v_y = __pyx_t_2; - /* "gensim/models/word2vec_inner.pyx":906 + /* "gensim/models/word2vec_inner.pyx":905 * cdef float *x = [10.0] * cdef float *y = [0.01] * cdef float expected = 0.1 # <<<<<<<<<<<<<< @@ -8346,7 +8400,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_expected = ((float)0.1); - /* "gensim/models/word2vec_inner.pyx":907 + /* "gensim/models/word2vec_inner.pyx":906 * cdef float *y = [0.01] * cdef float expected = 0.1 * cdef int size = 1 # <<<<<<<<<<<<<< @@ -8355,7 +8409,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_size = 1; - /* "gensim/models/word2vec_inner.pyx":912 + /* "gensim/models/word2vec_inner.pyx":911 * * # build the sigmoid table * for i in range(EXP_TABLE_SIZE): # <<<<<<<<<<<<<< @@ -8365,7 +8419,7 
@@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P for (__pyx_t_3 = 0; __pyx_t_3 < 0x3E8; __pyx_t_3+=1) { __pyx_v_i = __pyx_t_3; - /* "gensim/models/word2vec_inner.pyx":913 + /* "gensim/models/word2vec_inner.pyx":912 * # build the sigmoid table * for i in range(EXP_TABLE_SIZE): * EXP_TABLE[i] = exp((i / EXP_TABLE_SIZE * 2 - 1) * MAX_EXP) # <<<<<<<<<<<<<< @@ -8374,7 +8428,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ (__pyx_v_6gensim_6models_14word2vec_inner_EXP_TABLE[__pyx_v_i]) = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t)exp(((((__pyx_v_i / ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t)0x3E8)) * 2.0) - 1.0) * 6.0))); - /* "gensim/models/word2vec_inner.pyx":914 + /* "gensim/models/word2vec_inner.pyx":913 * for i in range(EXP_TABLE_SIZE): * EXP_TABLE[i] = exp((i / EXP_TABLE_SIZE * 2 - 1) * MAX_EXP) * EXP_TABLE[i] = (EXP_TABLE[i] / (EXP_TABLE[i] + 1)) # <<<<<<<<<<<<<< @@ -8383,7 +8437,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ (__pyx_v_6gensim_6models_14word2vec_inner_EXP_TABLE[__pyx_v_i]) = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t)((__pyx_v_6gensim_6models_14word2vec_inner_EXP_TABLE[__pyx_v_i]) / ((__pyx_v_6gensim_6models_14word2vec_inner_EXP_TABLE[__pyx_v_i]) + 1.0))); - /* "gensim/models/word2vec_inner.pyx":915 + /* "gensim/models/word2vec_inner.pyx":914 * EXP_TABLE[i] = exp((i / EXP_TABLE_SIZE * 2 - 1) * MAX_EXP) * EXP_TABLE[i] = (EXP_TABLE[i] / (EXP_TABLE[i] + 1)) * LOG_TABLE[i] = log( EXP_TABLE[i] ) # <<<<<<<<<<<<<< @@ -8393,7 +8447,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P (__pyx_v_6gensim_6models_14word2vec_inner_LOG_TABLE[__pyx_v_i]) = ((__pyx_t_6gensim_6models_14word2vec_inner_REAL_t)log((__pyx_v_6gensim_6models_14word2vec_inner_EXP_TABLE[__pyx_v_i]))); } - /* "gensim/models/word2vec_inner.pyx":918 + /* "gensim/models/word2vec_inner.pyx":917 * * # check whether sdot returns 
double or float * d_res = dsdot(&size, x, &ONE, y, &ONE) # <<<<<<<<<<<<<< @@ -8402,7 +8456,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_d_res = __pyx_v_6gensim_6models_14word2vec_inner_dsdot((&__pyx_v_size), __pyx_v_x, (&__pyx_v_6gensim_6models_14word2vec_inner_ONE), __pyx_v_y, (&__pyx_v_6gensim_6models_14word2vec_inner_ONE)); - /* "gensim/models/word2vec_inner.pyx":919 + /* "gensim/models/word2vec_inner.pyx":918 * # check whether sdot returns double or float * d_res = dsdot(&size, x, &ONE, y, &ONE) * p_res = &d_res # <<<<<<<<<<<<<< @@ -8411,7 +8465,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_p_res = ((float *)(&__pyx_v_d_res)); - /* "gensim/models/word2vec_inner.pyx":920 + /* "gensim/models/word2vec_inner.pyx":919 * d_res = dsdot(&size, x, &ONE, y, &ONE) * p_res = &d_res * if abs(d_res - expected) < 0.0001: # <<<<<<<<<<<<<< @@ -8421,7 +8475,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P __pyx_t_4 = ((fabs((__pyx_v_d_res - __pyx_v_expected)) < 0.0001) != 0); if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":921 + /* "gensim/models/word2vec_inner.pyx":920 * p_res = &d_res * if abs(d_res - expected) < 0.0001: * our_dot = our_dot_double # <<<<<<<<<<<<<< @@ -8430,7 +8484,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_6gensim_6models_14word2vec_inner_our_dot = __pyx_f_6gensim_6models_14word2vec_inner_our_dot_double; - /* "gensim/models/word2vec_inner.pyx":922 + /* "gensim/models/word2vec_inner.pyx":921 * if abs(d_res - expected) < 0.0001: * our_dot = our_dot_double * our_saxpy = saxpy # <<<<<<<<<<<<<< @@ -8439,7 +8493,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_6gensim_6models_14word2vec_inner_our_saxpy = __pyx_v_6gensim_6models_14word2vec_inner_saxpy; - /* "gensim/models/word2vec_inner.pyx":923 + /* 
"gensim/models/word2vec_inner.pyx":922 * our_dot = our_dot_double * our_saxpy = saxpy * return 0 # double # <<<<<<<<<<<<<< @@ -8451,7 +8505,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P __pyx_r = __pyx_int_0; goto __pyx_L0; - /* "gensim/models/word2vec_inner.pyx":920 + /* "gensim/models/word2vec_inner.pyx":919 * d_res = dsdot(&size, x, &ONE, y, &ONE) * p_res = &d_res * if abs(d_res - expected) < 0.0001: # <<<<<<<<<<<<<< @@ -8460,7 +8514,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ } - /* "gensim/models/word2vec_inner.pyx":924 + /* "gensim/models/word2vec_inner.pyx":923 * our_saxpy = saxpy * return 0 # double * elif abs(p_res[0] - expected) < 0.0001: # <<<<<<<<<<<<<< @@ -8470,7 +8524,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P __pyx_t_4 = ((fabsf(((__pyx_v_p_res[0]) - __pyx_v_expected)) < 0.0001) != 0); if (__pyx_t_4) { - /* "gensim/models/word2vec_inner.pyx":925 + /* "gensim/models/word2vec_inner.pyx":924 * return 0 # double * elif abs(p_res[0] - expected) < 0.0001: * our_dot = our_dot_float # <<<<<<<<<<<<<< @@ -8479,7 +8533,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_6gensim_6models_14word2vec_inner_our_dot = __pyx_f_6gensim_6models_14word2vec_inner_our_dot_float; - /* "gensim/models/word2vec_inner.pyx":926 + /* "gensim/models/word2vec_inner.pyx":925 * elif abs(p_res[0] - expected) < 0.0001: * our_dot = our_dot_float * our_saxpy = saxpy # <<<<<<<<<<<<<< @@ -8488,7 +8542,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_6gensim_6models_14word2vec_inner_our_saxpy = __pyx_v_6gensim_6models_14word2vec_inner_saxpy; - /* "gensim/models/word2vec_inner.pyx":927 + /* "gensim/models/word2vec_inner.pyx":926 * our_dot = our_dot_float * our_saxpy = saxpy * return 1 # float # <<<<<<<<<<<<<< @@ -8500,7 +8554,7 @@ static PyObject 
*__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P __pyx_r = __pyx_int_1; goto __pyx_L0; - /* "gensim/models/word2vec_inner.pyx":924 + /* "gensim/models/word2vec_inner.pyx":923 * our_saxpy = saxpy * return 0 # double * elif abs(p_res[0] - expected) < 0.0001: # <<<<<<<<<<<<<< @@ -8509,7 +8563,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ } - /* "gensim/models/word2vec_inner.pyx":931 + /* "gensim/models/word2vec_inner.pyx":930 * # neither => use cython loops, no BLAS * # actually, the BLAS is so messed up we'll probably have segfaulted above and never even reach here * our_dot = our_dot_noblas # <<<<<<<<<<<<<< @@ -8519,7 +8573,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P /*else*/ { __pyx_v_6gensim_6models_14word2vec_inner_our_dot = __pyx_f_6gensim_6models_14word2vec_inner_our_dot_noblas; - /* "gensim/models/word2vec_inner.pyx":932 + /* "gensim/models/word2vec_inner.pyx":931 * # actually, the BLAS is so messed up we'll probably have segfaulted above and never even reach here * our_dot = our_dot_noblas * our_saxpy = our_saxpy_noblas # <<<<<<<<<<<<<< @@ -8528,7 +8582,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P */ __pyx_v_6gensim_6models_14word2vec_inner_our_saxpy = __pyx_f_6gensim_6models_14word2vec_inner_our_saxpy_noblas; - /* "gensim/models/word2vec_inner.pyx":933 + /* "gensim/models/word2vec_inner.pyx":932 * our_dot = our_dot_noblas * our_saxpy = our_saxpy_noblas * return 2 # <<<<<<<<<<<<<< @@ -8541,7 +8595,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P goto __pyx_L0; } - /* "gensim/models/word2vec_inner.pyx":888 + /* "gensim/models/word2vec_inner.pyx":887 * * * def init(): # <<<<<<<<<<<<<< @@ -8556,7 +8610,7 @@ static PyObject *__pyx_pf_6gensim_6models_14word2vec_inner_8init(CYTHON_UNUSED P return __pyx_r; } -/* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":215 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -8594,8 +8648,9 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P int __pyx_t_4; int __pyx_t_5; int __pyx_t_6; - PyObject *__pyx_t_7 = NULL; - char *__pyx_t_8; + PyArray_Descr *__pyx_t_7; + PyObject *__pyx_t_8 = NULL; + char *__pyx_t_9; if (__pyx_v_info == NULL) { PyErr_SetString(PyExc_BufferError, "PyObject_GetBuffer: view==NULL argument is obsolete"); return -1; @@ -8604,7 +8659,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_v_info->obj = Py_None; __Pyx_INCREF(Py_None); __Pyx_GIVEREF(__pyx_v_info->obj); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":222 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 * * cdef int i, ndim * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -8613,7 +8668,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_endian_detector = 1; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":223 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 * cdef int i, ndim * cdef int endian_detector = 1 * cdef bint little_endian = ((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -8622,7 +8677,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":225 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 * cdef bint little_endian = ((&endian_detector)[0] != 0) * * ndim = PyArray_NDIM(self) # <<<<<<<<<<<<<< @@ -8631,11 +8686,11 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_ndim = PyArray_NDIM(__pyx_v_self); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":227 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") */ __pyx_t_2 = (((__pyx_v_flags & PyBUF_C_CONTIGUOUS) == PyBUF_C_CONTIGUOUS) != 0); @@ -8645,53 +8700,53 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L4_bool_binop_done; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":228 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): # <<<<<<<<<<<<<< * raise ValueError(u"ndarray is not C contiguous") * */ - __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_C_CONTIGUOUS) != 0)) != 0); + __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_ARRAY_C_CONTIGUOUS) != 0)) != 0); __pyx_t_1 = __pyx_t_2; __pyx_L4_bool_binop_done:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":227 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == 
pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") */ if (unlikely(__pyx_t_1)) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":229 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__3, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 229, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__2, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 272, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(1, 229, __pyx_L1_error) + __PYX_ERR(1, 272, __pyx_L1_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":227 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 * ndim = PyArray_NDIM(self) * * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":231 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # 
<<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") */ __pyx_t_2 = (((__pyx_v_flags & PyBUF_F_CONTIGUOUS) == PyBUF_F_CONTIGUOUS) != 0); @@ -8701,49 +8756,49 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L7_bool_binop_done; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":232 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): # <<<<<<<<<<<<<< * raise ValueError(u"ndarray is not Fortran contiguous") * */ - __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_F_CONTIGUOUS) != 0)) != 0); + __pyx_t_2 = ((!(PyArray_CHKFLAGS(__pyx_v_self, NPY_ARRAY_F_CONTIGUOUS) != 0)) != 0); __pyx_t_1 = __pyx_t_2; __pyx_L7_bool_binop_done:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":231 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") */ if (unlikely(__pyx_t_1)) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":233 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): 
* raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< * * info.buf = PyArray_DATA(self) */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__4, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 233, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__3, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 276, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(1, 233, __pyx_L1_error) + __PYX_ERR(1, 276, __pyx_L1_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":231 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 * raise ValueError(u"ndarray is not C contiguous") * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) # <<<<<<<<<<<<<< - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":235 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 * raise ValueError(u"ndarray is not Fortran contiguous") * * info.buf = PyArray_DATA(self) # <<<<<<<<<<<<<< @@ -8752,7 +8807,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->buf = PyArray_DATA(__pyx_v_self); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":236 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 * * info.buf = PyArray_DATA(self) * info.ndim = ndim # <<<<<<<<<<<<<< @@ -8761,7 +8816,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->ndim = __pyx_v_ndim; - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":237 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8771,7 +8826,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":240 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 * # Allocate new buffer for strides and shape info. * # This is allocated as one block, strides first. * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) # <<<<<<<<<<<<<< @@ -8780,7 +8835,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->strides = ((Py_ssize_t *)PyObject_Malloc((((sizeof(Py_ssize_t)) * 2) * ((size_t)__pyx_v_ndim)))); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":241 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 * # This is allocated as one block, strides first. 
* info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim # <<<<<<<<<<<<<< @@ -8789,7 +8844,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->shape = (__pyx_v_info->strides + __pyx_v_ndim); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":242 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":285 * info.strides = PyObject_Malloc(sizeof(Py_ssize_t) * 2 * ndim) * info.shape = info.strides + ndim * for i in range(ndim): # <<<<<<<<<<<<<< @@ -8801,7 +8856,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P for (__pyx_t_6 = 0; __pyx_t_6 < __pyx_t_5; __pyx_t_6+=1) { __pyx_v_i = __pyx_t_6; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":243 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 * info.shape = info.strides + ndim * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] # <<<<<<<<<<<<<< @@ -8810,7 +8865,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->strides[__pyx_v_i]) = (PyArray_STRIDES(__pyx_v_self)[__pyx_v_i]); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":244 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 * for i in range(ndim): * info.strides[i] = PyArray_STRIDES(self)[i] * info.shape[i] = PyArray_DIMS(self)[i] # <<<<<<<<<<<<<< @@ -8820,7 +8875,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_info->shape[__pyx_v_i]) = (PyArray_DIMS(__pyx_v_self)[__pyx_v_i]); } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":237 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 * info.buf = 
PyArray_DATA(self) * info.ndim = ndim * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -8830,7 +8885,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L9; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":246 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 * info.shape[i] = PyArray_DIMS(self)[i] * else: * info.strides = PyArray_STRIDES(self) # <<<<<<<<<<<<<< @@ -8840,7 +8895,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->strides = ((Py_ssize_t *)PyArray_STRIDES(__pyx_v_self)); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":247 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":290 * else: * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) # <<<<<<<<<<<<<< @@ -8851,7 +8906,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L9:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":248 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":291 * info.strides = PyArray_STRIDES(self) * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL # <<<<<<<<<<<<<< @@ -8860,7 +8915,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->suboffsets = NULL; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":249 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 * info.shape = PyArray_DIMS(self) * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) # <<<<<<<<<<<<<< @@ -8869,7 +8924,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->itemsize = 
PyArray_ITEMSIZE(__pyx_v_self); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":250 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":293 * info.suboffsets = NULL * info.itemsize = PyArray_ITEMSIZE(self) * info.readonly = not PyArray_ISWRITEABLE(self) # <<<<<<<<<<<<<< @@ -8878,28 +8933,29 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->readonly = (!(PyArray_ISWRITEABLE(__pyx_v_self) != 0)); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":253 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 * * cdef int t * cdef char* f = NULL # <<<<<<<<<<<<<< - * cdef dtype descr = self.descr + * cdef dtype descr = PyArray_DESCR(self) * cdef int offset */ __pyx_v_f = NULL; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":254 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 * cdef int t * cdef char* f = NULL - * cdef dtype descr = self.descr # <<<<<<<<<<<<<< + * cdef dtype descr = PyArray_DESCR(self) # <<<<<<<<<<<<<< * cdef int offset * */ - __pyx_t_3 = ((PyObject *)__pyx_v_self->descr); + __pyx_t_7 = PyArray_DESCR(__pyx_v_self); + __pyx_t_3 = ((PyObject *)__pyx_t_7); __Pyx_INCREF(__pyx_t_3); __pyx_v_descr = ((PyArray_Descr *)__pyx_t_3); __pyx_t_3 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":257 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":300 * cdef int offset * * info.obj = self # <<<<<<<<<<<<<< @@ -8912,7 +8968,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __Pyx_DECREF(__pyx_v_info->obj); __pyx_v_info->obj = ((PyObject *)__pyx_v_self); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":259 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -8922,7 +8978,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = ((!(PyDataType_HASFIELDS(__pyx_v_descr) != 0)) != 0); if (__pyx_t_1) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":260 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":303 * * if not PyDataType_HASFIELDS(descr): * t = descr.type_num # <<<<<<<<<<<<<< @@ -8932,7 +8988,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_4 = __pyx_v_descr->type_num; __pyx_v_t = __pyx_t_4; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":261 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -8952,7 +9008,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P } __pyx_L15_next_or:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":262 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":305 * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -8969,7 +9025,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_t_1 = __pyx_t_2; __pyx_L14_bool_binop_done:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":261 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or 
# <<<<<<<<<<<<<< @@ -8978,20 +9034,20 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ if (unlikely(__pyx_t_1)) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":263 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__5, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 263, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__4, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 306, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(1, 263, __pyx_L1_error) + __PYX_ERR(1, 306, __pyx_L1_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":261 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":304 * if not PyDataType_HASFIELDS(descr): * t = descr.type_num * if ((descr.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9000,7 +9056,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":264 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":307 * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" # <<<<<<<<<<<<<< @@ -9011,206 +9067,206 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P case NPY_BYTE: __pyx_v_f = ((char *)"b"); break; + case NPY_UBYTE: - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":265 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":308 * raise ValueError(u"Non-native byte order not supported") * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" # <<<<<<<<<<<<<< * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" */ - case NPY_UBYTE: __pyx_v_f = ((char *)"B"); break; + case NPY_SHORT: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":266 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":309 * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" # <<<<<<<<<<<<<< * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" */ - case NPY_SHORT: __pyx_v_f = ((char *)"h"); break; + case NPY_USHORT: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":267 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":310 * elif t == NPY_UBYTE: f = "B" * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" # <<<<<<<<<<<<<< * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" */ - case NPY_USHORT: __pyx_v_f = ((char *)"H"); break; + case NPY_INT: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":268 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":311 * elif t == NPY_SHORT: f = "h" * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" # <<<<<<<<<<<<<< * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" */ - case NPY_INT: __pyx_v_f = ((char *)"i"); break; + case NPY_UINT: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":269 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":312 * elif t == NPY_USHORT: f = "H" * elif t == NPY_INT: f = "i" * elif t == 
NPY_UINT: f = "I" # <<<<<<<<<<<<<< * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" */ - case NPY_UINT: __pyx_v_f = ((char *)"I"); break; + case NPY_LONG: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":270 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":313 * elif t == NPY_INT: f = "i" * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" # <<<<<<<<<<<<<< * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" */ - case NPY_LONG: __pyx_v_f = ((char *)"l"); break; + case NPY_ULONG: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":271 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":314 * elif t == NPY_UINT: f = "I" * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" # <<<<<<<<<<<<<< * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" */ - case NPY_ULONG: __pyx_v_f = ((char *)"L"); break; + case NPY_LONGLONG: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":315 * elif t == NPY_LONG: f = "l" * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" # <<<<<<<<<<<<<< * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" */ - case NPY_LONGLONG: __pyx_v_f = ((char *)"q"); break; + case NPY_ULONGLONG: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":273 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":316 * elif t == NPY_ULONG: f = "L" * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" # <<<<<<<<<<<<<< * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" */ - case NPY_ULONGLONG: __pyx_v_f = ((char *)"Q"); break; + case NPY_FLOAT: - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":274 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":317 * elif t == NPY_LONGLONG: f = "q" * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" # <<<<<<<<<<<<<< * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" */ - case NPY_FLOAT: __pyx_v_f = ((char *)"f"); break; + case NPY_DOUBLE: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":275 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":318 * elif t == NPY_ULONGLONG: f = "Q" * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" # <<<<<<<<<<<<<< * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" */ - case NPY_DOUBLE: __pyx_v_f = ((char *)"d"); break; + case NPY_LONGDOUBLE: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":319 * elif t == NPY_FLOAT: f = "f" * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" # <<<<<<<<<<<<<< * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" */ - case NPY_LONGDOUBLE: __pyx_v_f = ((char *)"g"); break; + case NPY_CFLOAT: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":277 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":320 * elif t == NPY_DOUBLE: f = "d" * elif t == NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" # <<<<<<<<<<<<<< * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" */ - case NPY_CFLOAT: __pyx_v_f = ((char *)"Zf"); break; + case NPY_CDOUBLE: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":278 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":321 * elif t == 
NPY_LONGDOUBLE: f = "g" * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" # <<<<<<<<<<<<<< * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" */ - case NPY_CDOUBLE: __pyx_v_f = ((char *)"Zd"); break; + case NPY_CLONGDOUBLE: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":279 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":322 * elif t == NPY_CFLOAT: f = "Zf" * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" # <<<<<<<<<<<<<< * elif t == NPY_OBJECT: f = "O" * else: */ - case NPY_CLONGDOUBLE: __pyx_v_f = ((char *)"Zg"); break; + case NPY_OBJECT: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":280 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":323 * elif t == NPY_CDOUBLE: f = "Zd" * elif t == NPY_CLONGDOUBLE: f = "Zg" * elif t == NPY_OBJECT: f = "O" # <<<<<<<<<<<<<< * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) */ - case NPY_OBJECT: __pyx_v_f = ((char *)"O"); break; default: - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":282 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":325 * elif t == NPY_OBJECT: f = "O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< * info.format = f * return */ - __pyx_t_3 = __Pyx_PyInt_From_int(__pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 282, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_int(__pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 325, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_7 = PyUnicode_Format(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_t_3); if (unlikely(!__pyx_t_7)) __PYX_ERR(1, 282, __pyx_L1_error) - __Pyx_GOTREF(__pyx_t_7); + __pyx_t_8 = PyUnicode_Format(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_t_3); if (unlikely(!__pyx_t_8)) 
__PYX_ERR(1, 325, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_8); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_3 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_7); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 282, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_8); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 325, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(1, 282, __pyx_L1_error) + __PYX_ERR(1, 325, __pyx_L1_error) break; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":283 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":326 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f # <<<<<<<<<<<<<< @@ -9219,7 +9275,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_info->format = __pyx_v_f; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":284 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":327 * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * info.format = f * return # <<<<<<<<<<<<<< @@ -9229,7 +9285,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P __pyx_r = 0; goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":259 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":302 * info.obj = self * * if not PyDataType_HASFIELDS(descr): # <<<<<<<<<<<<<< @@ -9238,7 +9294,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":286 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":329 * return * else: * info.format = PyObject_Malloc(_buffer_format_string_len) # <<<<<<<<<<<<<< @@ -9248,7 +9304,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P /*else*/ { __pyx_v_info->format = ((char *)PyObject_Malloc(0xFF)); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":287 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":330 * else: * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment # <<<<<<<<<<<<<< @@ -9257,7 +9313,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ (__pyx_v_info->format[0]) = '^'; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":288 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":331 * info.format = PyObject_Malloc(_buffer_format_string_len) * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 # <<<<<<<<<<<<<< @@ -9266,17 +9322,17 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P */ __pyx_v_offset = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":289 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":332 * info.format[0] = c'^' # Native data types, manual alignment * offset = 0 * f = _util_dtypestring(descr, info.format + 1, # <<<<<<<<<<<<<< * info.format + _buffer_format_string_len, * &offset) */ - __pyx_t_8 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format + 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_8 == ((char *)NULL))) __PYX_ERR(1, 289, __pyx_L1_error) - __pyx_v_f = __pyx_t_8; + __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_descr, (__pyx_v_info->format 
+ 1), (__pyx_v_info->format + 0xFF), (&__pyx_v_offset)); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 332, __pyx_L1_error) + __pyx_v_f = __pyx_t_9; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":292 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":335 * info.format + _buffer_format_string_len, * &offset) * f[0] = c'\0' # Terminate format string # <<<<<<<<<<<<<< @@ -9286,7 +9342,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P (__pyx_v_f[0]) = '\x00'; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":215 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":258 * # experimental exception made for __getbuffer__ and __releasebuffer__ * # -- the details of this may change. * def __getbuffer__(ndarray self, Py_buffer* info, int flags): # <<<<<<<<<<<<<< @@ -9299,7 +9355,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P goto __pyx_L0; __pyx_L1_error:; __Pyx_XDECREF(__pyx_t_3); - __Pyx_XDECREF(__pyx_t_7); + __Pyx_XDECREF(__pyx_t_8); __Pyx_AddTraceback("numpy.ndarray.__getbuffer__", __pyx_clineno, __pyx_lineno, __pyx_filename); __pyx_r = -1; if (__pyx_v_info->obj != NULL) { @@ -9318,7 +9374,7 @@ static int __pyx_pf_5numpy_7ndarray___getbuffer__(PyArrayObject *__pyx_v_self, P return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":294 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -9342,7 +9398,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s int __pyx_t_1; __Pyx_RefNannySetupContext("__releasebuffer__", 0); - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":295 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -9352,7 +9408,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (PyArray_HASFIELDS(__pyx_v_self) != 0); if (__pyx_t_1) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":296 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":339 * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) # <<<<<<<<<<<<<< @@ -9361,7 +9417,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->format); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":295 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":338 * * def __releasebuffer__(ndarray self, Py_buffer* info): * if PyArray_HASFIELDS(self): # <<<<<<<<<<<<<< @@ -9370,7 +9426,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -9380,7 +9436,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __pyx_t_1 = (((sizeof(npy_intp)) != (sizeof(Py_ssize_t))) != 0); if (__pyx_t_1) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":298 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":341 * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): * PyObject_Free(info.strides) # <<<<<<<<<<<<<< @@ -9389,7 +9445,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ PyObject_Free(__pyx_v_info->strides); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":297 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":340 * if PyArray_HASFIELDS(self): * PyObject_Free(info.format) * if sizeof(npy_intp) != sizeof(Py_ssize_t): # <<<<<<<<<<<<<< @@ -9398,7 +9454,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":294 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":337 * f[0] = c'\0' # Terminate format string * * def __releasebuffer__(ndarray self, Py_buffer* info): # <<<<<<<<<<<<<< @@ -9410,7 +9466,7 @@ static void __pyx_pf_5numpy_7ndarray_2__releasebuffer__(PyArrayObject *__pyx_v_s __Pyx_RefNannyFinishContext(); } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":775 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -9424,7 +9480,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew1", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":776 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":822 * * cdef inline object PyArray_MultiIterNew1(a): * return PyArray_MultiIterNew(1, a) # <<<<<<<<<<<<<< @@ -9432,13 +9488,13 @@ static 
CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ * cdef inline object PyArray_MultiIterNew2(a, b): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(1, ((void *)__pyx_v_a)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 776, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(1, ((void *)__pyx_v_a)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 822, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":775 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":821 * ctypedef npy_cdouble complex_t * * cdef inline object PyArray_MultiIterNew1(a): # <<<<<<<<<<<<<< @@ -9457,7 +9513,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew1(PyObject *__ return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -9471,7 +9527,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew2", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":779 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 * * cdef inline object PyArray_MultiIterNew2(a, b): * return PyArray_MultiIterNew(2, a, b) # <<<<<<<<<<<<<< @@ -9479,13 +9535,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ * cdef inline object PyArray_MultiIterNew3(a, b, c): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(2, ((void *)__pyx_v_a), ((void *)__pyx_v_b)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 779, __pyx_L1_error) + __pyx_t_1 = 
PyArray_MultiIterNew(2, ((void *)__pyx_v_a), ((void *)__pyx_v_b)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 825, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":778 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 * return PyArray_MultiIterNew(1, a) * * cdef inline object PyArray_MultiIterNew2(a, b): # <<<<<<<<<<<<<< @@ -9504,7 +9560,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew2(PyObject *__ return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":781 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -9518,7 +9574,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew3", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":782 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":828 * * cdef inline object PyArray_MultiIterNew3(a, b, c): * return PyArray_MultiIterNew(3, a, b, c) # <<<<<<<<<<<<<< @@ -9526,13 +9582,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ * cdef inline object PyArray_MultiIterNew4(a, b, c, d): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(3, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 782, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(3, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 828, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":781 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 * return PyArray_MultiIterNew(2, a, b) * * cdef inline object PyArray_MultiIterNew3(a, b, c): # <<<<<<<<<<<<<< @@ -9551,7 +9607,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew3(PyObject *__ return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -9565,7 +9621,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew4", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":785 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): * return PyArray_MultiIterNew(4, a, b, c, d) # <<<<<<<<<<<<<< @@ -9573,13 +9629,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(4, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 785, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(4, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 831, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":784 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":830 * return PyArray_MultiIterNew(3, a, b, c) * * cdef inline object PyArray_MultiIterNew4(a, b, c, d): # <<<<<<<<<<<<<< @@ -9598,7 +9654,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew4(PyObject *__ return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":787 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -9612,7 +9668,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("PyArray_MultiIterNew5", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":788 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): * return PyArray_MultiIterNew(5, a, b, c, d, e) # <<<<<<<<<<<<<< @@ -9620,13 +9676,13 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ * cdef inline tuple PyDataType_SHAPE(dtype d): */ __Pyx_XDECREF(__pyx_r); - __pyx_t_1 = PyArray_MultiIterNew(5, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d), ((void *)__pyx_v_e)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 788, __pyx_L1_error) + __pyx_t_1 = PyArray_MultiIterNew(5, ((void *)__pyx_v_a), ((void *)__pyx_v_b), ((void *)__pyx_v_c), ((void *)__pyx_v_d), ((void *)__pyx_v_e)); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 834, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_r = __pyx_t_1; __pyx_t_1 = 0; goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":787 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 * return 
PyArray_MultiIterNew(4, a, b, c, d) * * cdef inline object PyArray_MultiIterNew5(a, b, c, d, e): # <<<<<<<<<<<<<< @@ -9645,7 +9701,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyArray_MultiIterNew5(PyObject *__ return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -9659,7 +9715,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ int __pyx_t_1; __Pyx_RefNannySetupContext("PyDataType_SHAPE", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -9669,7 +9725,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_t_1 = (PyDataType_HASSUBARRAY(__pyx_v_d) != 0); if (__pyx_t_1) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":792 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): * return d.subarray.shape # <<<<<<<<<<<<<< @@ -9681,7 +9737,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ __pyx_r = ((PyObject*)__pyx_v_d->subarray->shape); goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":791 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 * * cdef inline tuple PyDataType_SHAPE(dtype d): * if PyDataType_HASSUBARRAY(d): # <<<<<<<<<<<<<< @@ -9690,7 +9746,7 @@ static CYTHON_INLINE PyObject 
*__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":794 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 * return d.subarray.shape * else: * return () # <<<<<<<<<<<<<< @@ -9704,7 +9760,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ goto __pyx_L0; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":790 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":836 * return PyArray_MultiIterNew(5, a, b, c, d, e) * * cdef inline tuple PyDataType_SHAPE(dtype d): # <<<<<<<<<<<<<< @@ -9719,7 +9775,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_PyDataType_SHAPE(PyArray_Descr *__ return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":796 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -9748,7 +9804,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx char *__pyx_t_9; __Pyx_RefNannySetupContext("_util_dtypestring", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":801 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 * * cdef dtype child * cdef int endian_detector = 1 # <<<<<<<<<<<<<< @@ -9757,7 +9813,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_endian_detector = 1; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":802 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 * cdef dtype child * cdef int endian_detector = 1 * cdef bint little_endian = 
((&endian_detector)[0] != 0) # <<<<<<<<<<<<<< @@ -9766,7 +9822,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_little_endian = ((((char *)(&__pyx_v_endian_detector))[0]) != 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -9775,21 +9831,21 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_v_descr->names == Py_None)) { PyErr_SetString(PyExc_TypeError, "'NoneType' object is not iterable"); - __PYX_ERR(1, 805, __pyx_L1_error) + __PYX_ERR(1, 851, __pyx_L1_error) } __pyx_t_1 = __pyx_v_descr->names; __Pyx_INCREF(__pyx_t_1); __pyx_t_2 = 0; for (;;) { if (__pyx_t_2 >= PyTuple_GET_SIZE(__pyx_t_1)) break; #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS - __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_2); __Pyx_INCREF(__pyx_t_3); __pyx_t_2++; if (unlikely(0 < 0)) __PYX_ERR(1, 805, __pyx_L1_error) + __pyx_t_3 = PyTuple_GET_ITEM(__pyx_t_1, __pyx_t_2); __Pyx_INCREF(__pyx_t_3); __pyx_t_2++; if (unlikely(0 < 0)) __PYX_ERR(1, 851, __pyx_L1_error) #else - __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_2); __pyx_t_2++; if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 805, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(__pyx_t_1, __pyx_t_2); __pyx_t_2++; if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 851, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); #endif __Pyx_XDECREF_SET(__pyx_v_childname, __pyx_t_3); __pyx_t_3 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":806 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 * * for childname in descr.names: * fields = descr.fields[childname] # <<<<<<<<<<<<<< @@ -9798,15 +9854,15 @@ static CYTHON_INLINE char 
*__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_v_descr->fields == Py_None)) { PyErr_SetString(PyExc_TypeError, "'NoneType' object is not subscriptable"); - __PYX_ERR(1, 806, __pyx_L1_error) + __PYX_ERR(1, 852, __pyx_L1_error) } - __pyx_t_3 = __Pyx_PyDict_GetItem(__pyx_v_descr->fields, __pyx_v_childname); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 806, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyDict_GetItem(__pyx_v_descr->fields, __pyx_v_childname); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 852, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - if (!(likely(PyTuple_CheckExact(__pyx_t_3))||((__pyx_t_3) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "tuple", Py_TYPE(__pyx_t_3)->tp_name), 0))) __PYX_ERR(1, 806, __pyx_L1_error) + if (!(likely(PyTuple_CheckExact(__pyx_t_3))||((__pyx_t_3) == Py_None)||(PyErr_Format(PyExc_TypeError, "Expected %.16s, got %.200s", "tuple", Py_TYPE(__pyx_t_3)->tp_name), 0))) __PYX_ERR(1, 852, __pyx_L1_error) __Pyx_XDECREF_SET(__pyx_v_fields, ((PyObject*)__pyx_t_3)); __pyx_t_3 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":807 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 * for childname in descr.names: * fields = descr.fields[childname] * child, new_offset = fields # <<<<<<<<<<<<<< @@ -9819,7 +9875,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx if (unlikely(size != 2)) { if (size > 2) __Pyx_RaiseTooManyValuesError(2); else if (size >= 0) __Pyx_RaiseNeedMoreValuesError(size); - __PYX_ERR(1, 807, __pyx_L1_error) + __PYX_ERR(1, 853, __pyx_L1_error) } #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS __pyx_t_3 = PyTuple_GET_ITEM(sequence, 0); @@ -9827,51 +9883,51 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __Pyx_INCREF(__pyx_t_3); __Pyx_INCREF(__pyx_t_4); #else - __pyx_t_3 = PySequence_ITEM(sequence, 0); if 
(unlikely(!__pyx_t_3)) __PYX_ERR(1, 807, __pyx_L1_error) + __pyx_t_3 = PySequence_ITEM(sequence, 0); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 853, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PySequence_ITEM(sequence, 1); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 807, __pyx_L1_error) + __pyx_t_4 = PySequence_ITEM(sequence, 1); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 853, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); #endif } else { - __Pyx_RaiseNoneNotIterableError(); __PYX_ERR(1, 807, __pyx_L1_error) + __Pyx_RaiseNoneNotIterableError(); __PYX_ERR(1, 853, __pyx_L1_error) } - if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_dtype))))) __PYX_ERR(1, 807, __pyx_L1_error) + if (!(likely(((__pyx_t_3) == Py_None) || likely(__Pyx_TypeTest(__pyx_t_3, __pyx_ptype_5numpy_dtype))))) __PYX_ERR(1, 853, __pyx_L1_error) __Pyx_XDECREF_SET(__pyx_v_child, ((PyArray_Descr *)__pyx_t_3)); __pyx_t_3 = 0; __Pyx_XDECREF_SET(__pyx_v_new_offset, __pyx_t_4); __pyx_t_4 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * */ - __pyx_t_4 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 809, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 855, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyNumber_Subtract(__pyx_v_new_offset, __pyx_t_4); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 809, __pyx_L1_error) + __pyx_t_3 = PyNumber_Subtract(__pyx_v_new_offset, __pyx_t_4); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 855, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_5 = __Pyx_PyInt_As_int(__pyx_t_3); if 
(unlikely((__pyx_t_5 == (int)-1) && PyErr_Occurred())) __PYX_ERR(1, 809, __pyx_L1_error) + __pyx_t_5 = __Pyx_PyInt_As_int(__pyx_t_3); if (unlikely((__pyx_t_5 == (int)-1) && PyErr_Occurred())) __PYX_ERR(1, 855, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __pyx_t_6 = ((((__pyx_v_end - __pyx_v_f) - ((int)__pyx_t_5)) < 15) != 0); if (unlikely(__pyx_t_6)) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":810 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< * * if ((child.byteorder == c'>' and little_endian) or */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__6, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 810, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__5, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 856, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(1, 810, __pyx_L1_error) + __PYX_ERR(1, 856, __pyx_L1_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":809 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 * child, new_offset = fields * * if (end - f) - (new_offset - offset[0]) < 15: # <<<<<<<<<<<<<< @@ -9880,7 +9936,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9900,7 +9956,7 @@ static 
CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __pyx_L8_next_or:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":813 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":859 * * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): # <<<<<<<<<<<<<< @@ -9917,7 +9973,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = __pyx_t_7; __pyx_L7_bool_binop_done:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9926,20 +9982,20 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ if (unlikely(__pyx_t_6)) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":814 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 * if ((child.byteorder == c'>' and little_endian) or * (child.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< * # One could encode it in the format string and have Cython * # complain instead, BUT: < and > in format strings also imply */ - __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__7, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 814, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyObject_Call(__pyx_builtin_ValueError, __pyx_tuple__4, NULL); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 860, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); __Pyx_Raise(__pyx_t_3, 0, 0, 0); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __PYX_ERR(1, 814, __pyx_L1_error) + __PYX_ERR(1, 860, __pyx_L1_error) - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":812 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":858 * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") * * if ((child.byteorder == c'>' and little_endian) or # <<<<<<<<<<<<<< @@ -9948,7 +10004,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":824 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":870 * * # Output padding bytes * while offset[0] < new_offset: # <<<<<<<<<<<<<< @@ -9956,15 +10012,15 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx * f += 1 */ while (1) { - __pyx_t_3 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 824, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_int((__pyx_v_offset[0])); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 870, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_t_3, __pyx_v_new_offset, Py_LT); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 824, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_t_3, __pyx_v_new_offset, Py_LT); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 870, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 824, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 870, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (!__pyx_t_6) break; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":825 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":871 * # Output padding bytes * while offset[0] < new_offset: * f[0] = 
120 # "x"; pad byte # <<<<<<<<<<<<<< @@ -9973,7 +10029,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ (__pyx_v_f[0]) = 0x78; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":826 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":872 * while offset[0] < new_offset: * f[0] = 120 # "x"; pad byte * f += 1 # <<<<<<<<<<<<<< @@ -9982,7 +10038,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":827 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":873 * f[0] = 120 # "x"; pad byte * f += 1 * offset[0] += 1 # <<<<<<<<<<<<<< @@ -9993,7 +10049,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + 1); } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":829 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":875 * offset[0] += 1 * * offset[0] += child.itemsize # <<<<<<<<<<<<<< @@ -10003,7 +10059,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_8 = 0; (__pyx_v_offset[__pyx_t_8]) = ((__pyx_v_offset[__pyx_t_8]) + __pyx_v_child->elsize); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -10013,19 +10069,19 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = ((!(PyDataType_HASFIELDS(__pyx_v_child) != 0)) != 0); if (__pyx_t_6) { - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":832 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":878 * * if not PyDataType_HASFIELDS(child): * t = child.type_num # <<<<<<<<<<<<<< * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") */ - __pyx_t_4 = __Pyx_PyInt_From_int(__pyx_v_child->type_num); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 832, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_int(__pyx_v_child->type_num); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 878, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); __Pyx_XDECREF_SET(__pyx_v_t, __pyx_t_4); __pyx_t_4 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -10035,20 +10091,20 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_t_6 = (((__pyx_v_end - __pyx_v_f) < 5) != 0); if (unlikely(__pyx_t_6)) { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< * * # Until ticket #99 is fixed, use integers to avoid warnings */ - __pyx_t_4 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__8, NULL); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 834, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyObject_Call(__pyx_builtin_RuntimeError, __pyx_tuple__6, NULL); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 880, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); __Pyx_Raise(__pyx_t_4, 0, 0, 0); __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __PYX_ERR(1, 834, __pyx_L1_error) + __PYX_ERR(1, 880, __pyx_L1_error) - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":833 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":879 * if not PyDataType_HASFIELDS(child): * t = child.type_num * if end - f < 5: # <<<<<<<<<<<<<< @@ -10057,252 +10113,252 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":837 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":883 * * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" # <<<<<<<<<<<<<< * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_BYTE); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 837, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_BYTE); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 883, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 837, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 883, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 837, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 883, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 98; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":838 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":884 * # Until ticket #99 is fixed, use integers to avoid warnings * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == 
NPY_UBYTE: f[0] = 66 #"B" # <<<<<<<<<<<<<< * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UBYTE); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 838, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UBYTE); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 884, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 838, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 884, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 838, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 884, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 66; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":839 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":885 * if t == NPY_BYTE: f[0] = 98 #"b" * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" # <<<<<<<<<<<<<< * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_SHORT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 839, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_SHORT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 885, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 839, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 885, 
__pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 839, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 885, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x68; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":840 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":886 * elif t == NPY_UBYTE: f[0] = 66 #"B" * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" # <<<<<<<<<<<<<< * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_USHORT); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 840, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_USHORT); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 886, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 840, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 886, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 840, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 886, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 72; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":841 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":887 * elif t == NPY_SHORT: f[0] = 104 #"h" * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" 
# <<<<<<<<<<<<<< * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_INT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 841, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_INT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 887, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 841, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 887, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 841, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 887, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x69; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":888 * elif t == NPY_USHORT: f[0] = 72 #"H" * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" # <<<<<<<<<<<<<< * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UINT); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 842, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_UINT); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 888, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 842, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 888, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); 
__pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 842, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 888, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 73; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":843 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":889 * elif t == NPY_INT: f[0] = 105 #"i" * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" # <<<<<<<<<<<<<< * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 843, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 889, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 843, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 889, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 843, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 889, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x6C; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":844 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":890 * elif t == NPY_UINT: f[0] = 73 #"I" * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" # <<<<<<<<<<<<<< * elif t == NPY_LONGLONG: 
f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 844, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 890, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 844, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 890, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 844, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 890, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 76; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":845 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":891 * elif t == NPY_LONG: f[0] = 108 #"l" * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" # <<<<<<<<<<<<<< * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGLONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 845, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGLONG); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 891, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 845, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 891, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 
0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 845, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 891, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x71; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":846 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":892 * elif t == NPY_ULONG: f[0] = 76 #"L" * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" # <<<<<<<<<<<<<< * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONGLONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 846, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_ULONGLONG); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 892, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 846, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 892, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 846, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 892, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 81; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":847 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":893 * elif t == NPY_LONGLONG: f[0] = 113 #"q" * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" # <<<<<<<<<<<<<< * elif t 
== NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_FLOAT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 847, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_FLOAT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 893, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 847, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 893, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 847, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 893, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x66; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":848 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":894 * elif t == NPY_ULONGLONG: f[0] = 81 #"Q" * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" # <<<<<<<<<<<<<< * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_DOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 848, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_DOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 894, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 848, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 894, 
__pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 848, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 894, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x64; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":849 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":895 * elif t == NPY_FLOAT: f[0] = 102 #"f" * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" # <<<<<<<<<<<<<< * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 849, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_LONGDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 895, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 849, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 895, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 849, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 895, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 0x67; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":850 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":896 * elif t == NPY_DOUBLE: f[0] = 100 #"d" * elif t == 
NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf # <<<<<<<<<<<<<< * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CFLOAT); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 850, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CFLOAT); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 896, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 850, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 896, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 850, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 896, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 90; @@ -10311,18 +10367,18 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":897 * elif t == NPY_LONGDOUBLE: f[0] = 103 #"g" * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd # <<<<<<<<<<<<<< * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 851, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CDOUBLE); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 897, __pyx_L1_error) 
__Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 851, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 897, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 851, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 897, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 90; @@ -10331,18 +10387,18 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":852 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":898 * elif t == NPY_CFLOAT: f[0] = 90; f[1] = 102; f += 1 # Zf * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg # <<<<<<<<<<<<<< * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: */ - __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CLONGDOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 852, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_CLONGDOUBLE); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 898, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 852, __pyx_L1_error) + __pyx_t_4 = PyObject_RichCompare(__pyx_v_t, __pyx_t_3, Py_EQ); __Pyx_XGOTREF(__pyx_t_4); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 898, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 852, __pyx_L1_error) + __pyx_t_6 = 
__Pyx_PyObject_IsTrue(__pyx_t_4); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 898, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; if (__pyx_t_6) { (__pyx_v_f[0]) = 90; @@ -10351,25 +10407,25 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":853 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":899 * elif t == NPY_CDOUBLE: f[0] = 90; f[1] = 100; f += 1 # Zd * elif t == NPY_CLONGDOUBLE: f[0] = 90; f[1] = 103; f += 1 # Zg * elif t == NPY_OBJECT: f[0] = 79 #"O" # <<<<<<<<<<<<<< * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) */ - __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_OBJECT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 853, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyInt_From_enum__NPY_TYPES(NPY_OBJECT); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 899, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); - __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 853, __pyx_L1_error) + __pyx_t_3 = PyObject_RichCompare(__pyx_v_t, __pyx_t_4, Py_EQ); __Pyx_XGOTREF(__pyx_t_3); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 899, __pyx_L1_error) __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 853, __pyx_L1_error) + __pyx_t_6 = __Pyx_PyObject_IsTrue(__pyx_t_3); if (unlikely(__pyx_t_6 < 0)) __PYX_ERR(1, 899, __pyx_L1_error) __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; if (likely(__pyx_t_6)) { (__pyx_v_f[0]) = 79; goto __pyx_L15; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":855 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":901 * elif t == NPY_OBJECT: f[0] = 79 #"O" * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) # <<<<<<<<<<<<<< @@ 
-10377,18 +10433,18 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx * else: */ /*else*/ { - __pyx_t_3 = PyUnicode_Format(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 855, __pyx_L1_error) + __pyx_t_3 = __Pyx_PyUnicode_FormatSafe(__pyx_kp_u_unknown_dtype_code_in_numpy_pxd, __pyx_v_t); if (unlikely(!__pyx_t_3)) __PYX_ERR(1, 901, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_3); - __pyx_t_4 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_3); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 855, __pyx_L1_error) + __pyx_t_4 = __Pyx_PyObject_CallOneArg(__pyx_builtin_ValueError, __pyx_t_3); if (unlikely(!__pyx_t_4)) __PYX_ERR(1, 901, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_4); __Pyx_DECREF(__pyx_t_3); __pyx_t_3 = 0; __Pyx_Raise(__pyx_t_4, 0, 0, 0); __Pyx_DECREF(__pyx_t_4); __pyx_t_4 = 0; - __PYX_ERR(1, 855, __pyx_L1_error) + __PYX_ERR(1, 901, __pyx_L1_error) } __pyx_L15:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":902 * else: * raise ValueError(u"unknown dtype code in numpy.pxd (%d)" % t) * f += 1 # <<<<<<<<<<<<<< @@ -10397,7 +10453,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx */ __pyx_v_f = (__pyx_v_f + 1); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":831 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":877 * offset[0] += child.itemsize * * if not PyDataType_HASFIELDS(child): # <<<<<<<<<<<<<< @@ -10407,7 +10463,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx goto __pyx_L13; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":860 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":906 * # Cython ignores struct boundary 
information ("T{...}"), * # so don't output it * f = _util_dtypestring(child, f, end, offset) # <<<<<<<<<<<<<< @@ -10415,12 +10471,12 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx * */ /*else*/ { - __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_child, __pyx_v_f, __pyx_v_end, __pyx_v_offset); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 860, __pyx_L1_error) + __pyx_t_9 = __pyx_f_5numpy__util_dtypestring(__pyx_v_child, __pyx_v_f, __pyx_v_end, __pyx_v_offset); if (unlikely(__pyx_t_9 == ((char *)NULL))) __PYX_ERR(1, 906, __pyx_L1_error) __pyx_v_f = __pyx_t_9; } __pyx_L13:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":805 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":851 * cdef tuple fields * * for childname in descr.names: # <<<<<<<<<<<<<< @@ -10430,7 +10486,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx } __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":861 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":907 * # so don't output it * f = _util_dtypestring(child, f, end, offset) * return f # <<<<<<<<<<<<<< @@ -10440,7 +10496,7 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx __pyx_r = __pyx_v_f; goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":796 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":842 * return () * * cdef inline char* _util_dtypestring(dtype descr, char* f, char* end, int* offset) except NULL: # <<<<<<<<<<<<<< @@ -10465,166 +10521,120 @@ static CYTHON_INLINE char *__pyx_f_5numpy__util_dtypestring(PyArray_Descr *__pyx return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":977 - 
* +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< - * cdef PyObject* baseptr - * if base is None: + * Py_INCREF(base) # important to do this before stealing the reference below! + * PyArray_SetBaseObject(arr, base) */ static CYTHON_INLINE void __pyx_f_5numpy_set_array_base(PyArrayObject *__pyx_v_arr, PyObject *__pyx_v_base) { - PyObject *__pyx_v_baseptr; __Pyx_RefNannyDeclarations - int __pyx_t_1; - int __pyx_t_2; __Pyx_RefNannySetupContext("set_array_base", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":979 - * cdef inline void set_array_base(ndarray arr, object base): - * cdef PyObject* baseptr - * if base is None: # <<<<<<<<<<<<<< - * baseptr = NULL - * else: - */ - __pyx_t_1 = (__pyx_v_base == Py_None); - __pyx_t_2 = (__pyx_t_1 != 0); - if (__pyx_t_2) { - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":980 - * cdef PyObject* baseptr - * if base is None: - * baseptr = NULL # <<<<<<<<<<<<<< - * else: - * Py_INCREF(base) # important to do this before decref below! - */ - __pyx_v_baseptr = NULL; - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":979 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1023 + * * cdef inline void set_array_base(ndarray arr, object base): - * cdef PyObject* baseptr - * if base is None: # <<<<<<<<<<<<<< - * baseptr = NULL - * else: - */ - goto __pyx_L3; - } - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":982 - * baseptr = NULL - * else: - * Py_INCREF(base) # important to do this before decref below! 
# <<<<<<<<<<<<<< - * baseptr = base - * Py_XDECREF(arr.base) - */ - /*else*/ { - Py_INCREF(__pyx_v_base); - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":983 - * else: - * Py_INCREF(base) # important to do this before decref below! - * baseptr = base # <<<<<<<<<<<<<< - * Py_XDECREF(arr.base) - * arr.base = baseptr - */ - __pyx_v_baseptr = ((PyObject *)__pyx_v_base); - } - __pyx_L3:; - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":984 - * Py_INCREF(base) # important to do this before decref below! - * baseptr = base - * Py_XDECREF(arr.base) # <<<<<<<<<<<<<< - * arr.base = baseptr + * Py_INCREF(base) # important to do this before stealing the reference below! # <<<<<<<<<<<<<< + * PyArray_SetBaseObject(arr, base) * */ - Py_XDECREF(__pyx_v_arr->base); + Py_INCREF(__pyx_v_base); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":985 - * baseptr = base - * Py_XDECREF(arr.base) - * arr.base = baseptr # <<<<<<<<<<<<<< + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1024 + * cdef inline void set_array_base(ndarray arr, object base): + * Py_INCREF(base) # important to do this before stealing the reference below! + * PyArray_SetBaseObject(arr, base) # <<<<<<<<<<<<<< * * cdef inline object get_array_base(ndarray arr): */ - __pyx_v_arr->base = __pyx_v_baseptr; + (void)(PyArray_SetBaseObject(__pyx_v_arr, __pyx_v_base)); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":977 - * + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1022 + * int _import_umath() except -1 * * cdef inline void set_array_base(ndarray arr, object base): # <<<<<<<<<<<<<< - * cdef PyObject* baseptr - * if base is None: + * Py_INCREF(base) # important to do this before stealing the reference below! 
+ * PyArray_SetBaseObject(arr, base) */ /* function exit code */ __Pyx_RefNannyFinishContext(); } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":987 - * arr.base = baseptr +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< - * if arr.base is NULL: - * return None + * base = PyArray_BASE(arr) + * if base is NULL: */ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__pyx_v_arr) { + PyObject *__pyx_v_base; PyObject *__pyx_r = NULL; __Pyx_RefNannyDeclarations int __pyx_t_1; __Pyx_RefNannySetupContext("get_array_base", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":988 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1027 * * cdef inline object get_array_base(ndarray arr): - * if arr.base is NULL: # <<<<<<<<<<<<<< + * base = PyArray_BASE(arr) # <<<<<<<<<<<<<< + * if base is NULL: * return None - * else: */ - __pyx_t_1 = ((__pyx_v_arr->base == NULL) != 0); - if (__pyx_t_1) { + __pyx_v_base = PyArray_BASE(__pyx_v_arr); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":989 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): - * if arr.base is NULL: + * base = PyArray_BASE(arr) + * if base is NULL: # <<<<<<<<<<<<<< + * return None + * return base + */ + __pyx_t_1 = ((__pyx_v_base == NULL) != 0); + if (__pyx_t_1) { + + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1029 + * base = PyArray_BASE(arr) + * if base is NULL: * return None # <<<<<<<<<<<<<< - * else: - * return arr.base + * return base + * */ __Pyx_XDECREF(__pyx_r); __pyx_r = Py_None; __Pyx_INCREF(Py_None); goto __pyx_L0; - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":988 - * + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1028 * cdef inline object get_array_base(ndarray arr): - * if arr.base is NULL: # <<<<<<<<<<<<<< + * base = PyArray_BASE(arr) + * if base is NULL: # <<<<<<<<<<<<<< * return None - * else: + * return base */ } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":991 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1030 + * if base is NULL: * return None - * else: - * return arr.base # <<<<<<<<<<<<<< - * + * return base # <<<<<<<<<<<<<< * + * # Versions of the import_* functions which are more suitable for */ - /*else*/ { - __Pyx_XDECREF(__pyx_r); - __Pyx_INCREF(((PyObject *)__pyx_v_arr->base)); - __pyx_r = ((PyObject *)__pyx_v_arr->base); - goto __pyx_L0; - } + __Pyx_XDECREF(__pyx_r); + __Pyx_INCREF(((PyObject *)__pyx_v_base)); + __pyx_r = ((PyObject *)__pyx_v_base); + goto __pyx_L0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":987 - * arr.base = baseptr + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1026 + * PyArray_SetBaseObject(arr, base) * * cdef inline object get_array_base(ndarray arr): # <<<<<<<<<<<<<< - * if arr.base is NULL: - * return None + * base = PyArray_BASE(arr) + * if base is NULL: */ /* function exit code */ @@ -10634,7 +10644,7 @@ static CYTHON_INLINE PyObject *__pyx_f_5numpy_get_array_base(PyArrayObject *__py return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":996 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. 
* cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -10655,7 +10665,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_array", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":997 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -10671,16 +10681,16 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":998 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1036 * cdef inline int import_array() except -1: * try: * _import_array() # <<<<<<<<<<<<<< * except Exception: * raise ImportError("numpy.core.multiarray failed to import") */ - __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 998, __pyx_L3_error) + __pyx_t_4 = _import_array(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1036, __pyx_L3_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":997 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. 
* cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -10694,7 +10704,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":999 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1037 * try: * _import_array() * except Exception: # <<<<<<<<<<<<<< @@ -10704,28 +10714,28 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_t_4 = __Pyx_PyErr_ExceptionMatches(((PyObject *)(&((PyTypeObject*)PyExc_Exception)[0]))); if (__pyx_t_4) { __Pyx_AddTraceback("numpy.import_array", __pyx_clineno, __pyx_lineno, __pyx_filename); - if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(1, 999, __pyx_L5_except_error) + if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(1, 1037, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_5); __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1000 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_umath() except -1: */ - __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__9, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(1, 1000, __pyx_L5_except_error) + __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__7, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(1, 1038, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_Raise(__pyx_t_8, 0, 0, 0); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __PYX_ERR(1, 1000, __pyx_L5_except_error) + __PYX_ERR(1, 1038, __pyx_L5_except_error) } goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* 
"../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":997 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1035 * # Cython code. * cdef inline int import_array() except -1: * try: # <<<<<<<<<<<<<< @@ -10740,7 +10750,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { __pyx_L8_try_end:; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":996 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1034 * # Versions of the import_* functions which are more suitable for * # Cython code. * cdef inline int import_array() except -1: # <<<<<<<<<<<<<< @@ -10763,7 +10773,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_array(void) { return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1002 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -10784,7 +10794,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_umath", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1003 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -10800,16 +10810,16 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __Pyx_XGOTREF(__pyx_t_3); /*try:*/ { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1004 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1042 * cdef inline int import_umath() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< * except Exception: * raise ImportError("numpy.core.umath 
failed to import") */ - __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1004, __pyx_L3_error) + __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1042, __pyx_L3_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1003 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -10823,7 +10833,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1005 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1043 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -10833,28 +10843,28 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_t_4 = __Pyx_PyErr_ExceptionMatches(((PyObject *)(&((PyTypeObject*)PyExc_Exception)[0]))); if (__pyx_t_4) { __Pyx_AddTraceback("numpy.import_umath", __pyx_clineno, __pyx_lineno, __pyx_filename); - if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(1, 1005, __pyx_L5_except_error) + if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(1, 1043, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_5); __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1006 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_ufunc() except -1: */ - __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__10, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(1, 1006, __pyx_L5_except_error) + __pyx_t_8 = 
__Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__8, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(1, 1044, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_Raise(__pyx_t_8, 0, 0, 0); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __PYX_ERR(1, 1006, __pyx_L5_except_error) + __PYX_ERR(1, 1044, __pyx_L5_except_error) } goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1003 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1041 * * cdef inline int import_umath() except -1: * try: # <<<<<<<<<<<<<< @@ -10869,7 +10879,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { __pyx_L8_try_end:; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1002 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1040 * raise ImportError("numpy.core.multiarray failed to import") * * cdef inline int import_umath() except -1: # <<<<<<<<<<<<<< @@ -10892,7 +10902,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_umath(void) { return __pyx_r; } -/* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1008 +/* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -10913,7 +10923,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { PyObject *__pyx_t_8 = NULL; __Pyx_RefNannySetupContext("import_ufunc", 0); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1009 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -10929,16 +10939,16 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __Pyx_XGOTREF(__pyx_t_3); 
/*try:*/ { - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1010 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1048 * cdef inline int import_ufunc() except -1: * try: * _import_umath() # <<<<<<<<<<<<<< * except Exception: * raise ImportError("numpy.core.umath failed to import") */ - __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1010, __pyx_L3_error) + __pyx_t_4 = _import_umath(); if (unlikely(__pyx_t_4 == ((int)-1))) __PYX_ERR(1, 1048, __pyx_L3_error) - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1009 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -10952,7 +10962,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { goto __pyx_L8_try_end; __pyx_L3_error:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1011 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1049 * try: * _import_umath() * except Exception: # <<<<<<<<<<<<<< @@ -10961,26 +10971,26 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_t_4 = __Pyx_PyErr_ExceptionMatches(((PyObject *)(&((PyTypeObject*)PyExc_Exception)[0]))); if (__pyx_t_4) { __Pyx_AddTraceback("numpy.import_ufunc", __pyx_clineno, __pyx_lineno, __pyx_filename); - if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(1, 1011, __pyx_L5_except_error) + if (__Pyx_GetException(&__pyx_t_5, &__pyx_t_6, &__pyx_t_7) < 0) __PYX_ERR(1, 1049, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_5); __Pyx_GOTREF(__pyx_t_6); __Pyx_GOTREF(__pyx_t_7); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1012 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1050 * _import_umath() * 
except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< */ - __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__11, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(1, 1012, __pyx_L5_except_error) + __pyx_t_8 = __Pyx_PyObject_Call(__pyx_builtin_ImportError, __pyx_tuple__8, NULL); if (unlikely(!__pyx_t_8)) __PYX_ERR(1, 1050, __pyx_L5_except_error) __Pyx_GOTREF(__pyx_t_8); __Pyx_Raise(__pyx_t_8, 0, 0, 0); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; - __PYX_ERR(1, 1012, __pyx_L5_except_error) + __PYX_ERR(1, 1050, __pyx_L5_except_error) } goto __pyx_L5_except_error; __pyx_L5_except_error:; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1009 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1047 * * cdef inline int import_ufunc() except -1: * try: # <<<<<<<<<<<<<< @@ -10995,7 +11005,7 @@ static CYTHON_INLINE int __pyx_f_5numpy_import_ufunc(void) { __pyx_L8_try_end:; } - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1008 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -11053,6 +11063,15 @@ static struct PyModuleDef __pyx_moduledef = { NULL /* m_free */ }; #endif +#ifndef CYTHON_SMALL_CODE +#if defined(__clang__) + #define CYTHON_SMALL_CODE +#elif defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 3)) + #define CYTHON_SMALL_CODE __attribute__((cold)) +#else + #define CYTHON_SMALL_CODE +#endif +#endif static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_EXP_TABLE, __pyx_k_EXP_TABLE, sizeof(__pyx_k_EXP_TABLE), 0, 0, 1, 1}, @@ -11065,7 +11084,7 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_REAL, __pyx_k_REAL, sizeof(__pyx_k_REAL), 0, 0, 1, 1}, {&__pyx_n_s_RuntimeError, 
__pyx_k_RuntimeError, sizeof(__pyx_k_RuntimeError), 0, 0, 1, 1}, {&__pyx_n_s_ValueError, __pyx_k_ValueError, sizeof(__pyx_k_ValueError), 0, 0, 1, 1}, - {&__pyx_n_s__12, __pyx_k__12, sizeof(__pyx_k__12), 0, 0, 1, 1}, + {&__pyx_n_s__9, __pyx_k__9, sizeof(__pyx_k__9), 0, 0, 1, 1}, {&__pyx_n_s_alpha, __pyx_k_alpha, sizeof(__pyx_k_alpha), 0, 0, 1, 1}, {&__pyx_n_s_c, __pyx_k_c, sizeof(__pyx_k_c), 0, 0, 1, 1}, {&__pyx_n_s_cbow_mean, __pyx_k_cbow_mean, sizeof(__pyx_k_cbow_mean), 0, 0, 1, 1}, @@ -11084,6 +11103,7 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_fblas, __pyx_k_fblas, sizeof(__pyx_k_fblas), 0, 0, 1, 1}, {&__pyx_n_s_float32, __pyx_k_float32, sizeof(__pyx_k_float32), 0, 0, 1, 1}, {&__pyx_n_s_gensim_models_word2vec_inner, __pyx_k_gensim_models_word2vec_inner, sizeof(__pyx_k_gensim_models_word2vec_inner), 0, 0, 1, 1}, + {&__pyx_kp_s_gensim_models_word2vec_inner_pyx, __pyx_k_gensim_models_word2vec_inner_pyx, sizeof(__pyx_k_gensim_models_word2vec_inner_pyx), 0, 0, 1, 0}, {&__pyx_n_s_hs, __pyx_k_hs, sizeof(__pyx_k_hs), 0, 0, 1, 1}, {&__pyx_n_s_i, __pyx_k_i, sizeof(__pyx_k_i), 0, 0, 1, 1}, {&__pyx_n_s_idx_end, __pyx_k_idx_end, sizeof(__pyx_k_idx_end), 0, 0, 1, 1}, @@ -11096,6 +11116,7 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_k, __pyx_k_k, sizeof(__pyx_k_k), 0, 0, 1, 1}, {&__pyx_n_s_main, __pyx_k_main, sizeof(__pyx_k_main), 0, 0, 1, 1}, {&__pyx_n_s_model, __pyx_k_model, sizeof(__pyx_k_model), 0, 0, 1, 1}, + {&__pyx_n_s_name, __pyx_k_name, sizeof(__pyx_k_name), 0, 0, 1, 1}, {&__pyx_kp_u_ndarray_is_not_C_contiguous, __pyx_k_ndarray_is_not_C_contiguous, sizeof(__pyx_k_ndarray_is_not_C_contiguous), 0, 1, 0, 0}, {&__pyx_kp_u_ndarray_is_not_Fortran_contiguou, __pyx_k_ndarray_is_not_Fortran_contiguou, sizeof(__pyx_k_ndarray_is_not_Fortran_contiguou), 0, 1, 0, 0}, {&__pyx_n_s_negative, __pyx_k_negative, sizeof(__pyx_k_negative), 0, 0, 1, 1}, @@ -11114,7 +11135,6 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_range, 
__pyx_k_range, sizeof(__pyx_k_range), 0, 0, 1, 1}, {&__pyx_n_s_result, __pyx_k_result, sizeof(__pyx_k_result), 0, 0, 1, 1}, {&__pyx_n_s_running_training_loss, __pyx_k_running_training_loss, sizeof(__pyx_k_running_training_loss), 0, 0, 1, 1}, - {&__pyx_n_s_running_training_loss_sample, __pyx_k_running_training_loss_sample, sizeof(__pyx_k_running_training_loss_sample), 0, 0, 1, 1}, {&__pyx_n_s_sample, __pyx_k_sample, sizeof(__pyx_k_sample), 0, 0, 1, 1}, {&__pyx_n_s_sample_int, __pyx_k_sample_int, sizeof(__pyx_k_sample_int), 0, 0, 1, 1}, {&__pyx_n_s_saxpy, __pyx_k_saxpy, sizeof(__pyx_k_saxpy), 0, 0, 1, 1}, @@ -11147,7 +11167,6 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_vocabulary, __pyx_k_vocabulary, sizeof(__pyx_k_vocabulary), 0, 0, 1, 1}, {&__pyx_n_s_window, __pyx_k_window, sizeof(__pyx_k_window), 0, 0, 1, 1}, {&__pyx_n_s_word, __pyx_k_word, sizeof(__pyx_k_word), 0, 0, 1, 1}, - {&__pyx_kp_s_word2vec_inner_pyx, __pyx_k_word2vec_inner_pyx, sizeof(__pyx_k_word2vec_inner_pyx), 0, 0, 1, 0}, {&__pyx_n_s_work, __pyx_k_work, sizeof(__pyx_k_work), 0, 0, 1, 1}, {&__pyx_n_s_workers, __pyx_k_workers, sizeof(__pyx_k_workers), 0, 0, 1, 1}, {&__pyx_n_s_wv, __pyx_k_wv, sizeof(__pyx_k_wv), 0, 0, 1, 1}, @@ -11155,18 +11174,18 @@ static __Pyx_StringTabEntry __pyx_string_tab[] = { {&__pyx_n_s_y, __pyx_k_y, sizeof(__pyx_k_y), 0, 0, 1, 1}, {0, 0, 0, 0, 0, 0, 0} }; -static int __Pyx_InitCachedBuiltins(void) { +static CYTHON_SMALL_CODE int __Pyx_InitCachedBuiltins(void) { __pyx_builtin_ImportError = __Pyx_GetBuiltinName(__pyx_n_s_ImportError); if (!__pyx_builtin_ImportError) __PYX_ERR(0, 25, __pyx_L1_error) __pyx_builtin_range = __Pyx_GetBuiltinName(__pyx_n_s_range); if (!__pyx_builtin_range) __PYX_ERR(0, 119, __pyx_L1_error) __pyx_builtin_enumerate = __Pyx_GetBuiltinName(__pyx_n_s_enumerate); if (!__pyx_builtin_enumerate) __PYX_ERR(0, 566, __pyx_L1_error) - __pyx_builtin_ValueError = __Pyx_GetBuiltinName(__pyx_n_s_ValueError); if (!__pyx_builtin_ValueError) 
__PYX_ERR(1, 229, __pyx_L1_error) - __pyx_builtin_RuntimeError = __Pyx_GetBuiltinName(__pyx_n_s_RuntimeError); if (!__pyx_builtin_RuntimeError) __PYX_ERR(1, 810, __pyx_L1_error) + __pyx_builtin_ValueError = __Pyx_GetBuiltinName(__pyx_n_s_ValueError); if (!__pyx_builtin_ValueError) __PYX_ERR(1, 272, __pyx_L1_error) + __pyx_builtin_RuntimeError = __Pyx_GetBuiltinName(__pyx_n_s_RuntimeError); if (!__pyx_builtin_RuntimeError) __PYX_ERR(1, 856, __pyx_L1_error) return 0; __pyx_L1_error:; return -1; } -static int __Pyx_InitCachedConstants(void) { +static CYTHON_SMALL_CODE int __Pyx_InitCachedConstants(void) { __Pyx_RefNannyDeclarations __Pyx_RefNannySetupContext("__Pyx_InitCachedConstants", 0); @@ -11180,106 +11199,83 @@ static int __Pyx_InitCachedConstants(void) { __pyx_tuple_ = PyTuple_Pack(2, __pyx_int_0, __pyx_int_16777216); if (unlikely(!__pyx_tuple_)) __PYX_ERR(0, 491, __pyx_L1_error) __Pyx_GOTREF(__pyx_tuple_); __Pyx_GIVEREF(__pyx_tuple_); - __pyx_tuple__2 = PyTuple_Pack(2, __pyx_int_0, __pyx_int_16777216); if (unlikely(!__pyx_tuple__2)) __PYX_ERR(0, 491, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__2); - __Pyx_GIVEREF(__pyx_tuple__2); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":229 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":272 * if ((flags & pybuf.PyBUF_C_CONTIGUOUS == pybuf.PyBUF_C_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_C_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_C_CONTIGUOUS)): * raise ValueError(u"ndarray is not C contiguous") # <<<<<<<<<<<<<< * * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) */ - __pyx_tuple__3 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_C_contiguous); if (unlikely(!__pyx_tuple__3)) __PYX_ERR(1, 229, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__3); - __Pyx_GIVEREF(__pyx_tuple__3); + __pyx_tuple__2 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_C_contiguous); if (unlikely(!__pyx_tuple__2)) __PYX_ERR(1, 272, 
__pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__2); + __Pyx_GIVEREF(__pyx_tuple__2); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":233 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":276 * if ((flags & pybuf.PyBUF_F_CONTIGUOUS == pybuf.PyBUF_F_CONTIGUOUS) - * and not PyArray_CHKFLAGS(self, NPY_F_CONTIGUOUS)): + * and not PyArray_CHKFLAGS(self, NPY_ARRAY_F_CONTIGUOUS)): * raise ValueError(u"ndarray is not Fortran contiguous") # <<<<<<<<<<<<<< * * info.buf = PyArray_DATA(self) */ - __pyx_tuple__4 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_Fortran_contiguou); if (unlikely(!__pyx_tuple__4)) __PYX_ERR(1, 233, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__4); - __Pyx_GIVEREF(__pyx_tuple__4); + __pyx_tuple__3 = PyTuple_Pack(1, __pyx_kp_u_ndarray_is_not_Fortran_contiguou); if (unlikely(!__pyx_tuple__3)) __PYX_ERR(1, 276, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__3); + __Pyx_GIVEREF(__pyx_tuple__3); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":263 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":306 * if ((descr.byteorder == c'>' and little_endian) or * (descr.byteorder == c'<' and not little_endian)): * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< * if t == NPY_BYTE: f = "b" * elif t == NPY_UBYTE: f = "B" */ - __pyx_tuple__5 = PyTuple_Pack(1, __pyx_kp_u_Non_native_byte_order_not_suppor); if (unlikely(!__pyx_tuple__5)) __PYX_ERR(1, 263, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__5); - __Pyx_GIVEREF(__pyx_tuple__5); + __pyx_tuple__4 = PyTuple_Pack(1, __pyx_kp_u_Non_native_byte_order_not_suppor); if (unlikely(!__pyx_tuple__4)) __PYX_ERR(1, 306, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__4); + __Pyx_GIVEREF(__pyx_tuple__4); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":810 + /* 
"../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":856 * * if (end - f) - (new_offset - offset[0]) < 15: * raise RuntimeError(u"Format string allocated too short, see comment in numpy.pxd") # <<<<<<<<<<<<<< * * if ((child.byteorder == c'>' and little_endian) or */ - __pyx_tuple__6 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor); if (unlikely(!__pyx_tuple__6)) __PYX_ERR(1, 810, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__6); - __Pyx_GIVEREF(__pyx_tuple__6); - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":814 - * if ((child.byteorder == c'>' and little_endian) or - * (child.byteorder == c'<' and not little_endian)): - * raise ValueError(u"Non-native byte order not supported") # <<<<<<<<<<<<<< - * # One could encode it in the format string and have Cython - * # complain instead, BUT: < and > in format strings also imply - */ - __pyx_tuple__7 = PyTuple_Pack(1, __pyx_kp_u_Non_native_byte_order_not_suppor); if (unlikely(!__pyx_tuple__7)) __PYX_ERR(1, 814, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__7); - __Pyx_GIVEREF(__pyx_tuple__7); + __pyx_tuple__5 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor); if (unlikely(!__pyx_tuple__5)) __PYX_ERR(1, 856, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__5); + __Pyx_GIVEREF(__pyx_tuple__5); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":834 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":880 * t = child.type_num * if end - f < 5: * raise RuntimeError(u"Format string allocated too short.") # <<<<<<<<<<<<<< * * # Until ticket #99 is fixed, use integers to avoid warnings */ - __pyx_tuple__8 = PyTuple_Pack(1, __pyx_kp_u_Format_string_allocated_too_shor_2); if (unlikely(!__pyx_tuple__8)) __PYX_ERR(1, 834, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__8); - __Pyx_GIVEREF(__pyx_tuple__8); + __pyx_tuple__6 = PyTuple_Pack(1, 
__pyx_kp_u_Format_string_allocated_too_shor_2); if (unlikely(!__pyx_tuple__6)) __PYX_ERR(1, 880, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__6); + __Pyx_GIVEREF(__pyx_tuple__6); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1000 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1038 * _import_array() * except Exception: * raise ImportError("numpy.core.multiarray failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_umath() except -1: */ - __pyx_tuple__9 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_multiarray_failed_to); if (unlikely(!__pyx_tuple__9)) __PYX_ERR(1, 1000, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__9); - __Pyx_GIVEREF(__pyx_tuple__9); + __pyx_tuple__7 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_multiarray_failed_to); if (unlikely(!__pyx_tuple__7)) __PYX_ERR(1, 1038, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__7); + __Pyx_GIVEREF(__pyx_tuple__7); - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1006 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1044 * _import_umath() * except Exception: * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< * * cdef inline int import_ufunc() except -1: */ - __pyx_tuple__10 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__10)) __PYX_ERR(1, 1006, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__10); - __Pyx_GIVEREF(__pyx_tuple__10); - - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1012 - * _import_umath() - * except Exception: - * raise ImportError("numpy.core.umath failed to import") # <<<<<<<<<<<<<< - */ - __pyx_tuple__11 = PyTuple_Pack(1, __pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__11)) __PYX_ERR(1, 1012, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__11); - __Pyx_GIVEREF(__pyx_tuple__11); + __pyx_tuple__8 = PyTuple_Pack(1, 
__pyx_kp_s_numpy_core_umath_failed_to_impor); if (unlikely(!__pyx_tuple__8)) __PYX_ERR(1, 1044, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__8); + __Pyx_GIVEREF(__pyx_tuple__8); /* "gensim/models/word2vec_inner.pyx":500 * @@ -11288,58 +11284,58 @@ static int __Pyx_InitCachedConstants(void) { * """Update skip-gram model by training on a batch of sentences. * */ - __pyx_tuple__13 = PyTuple_Pack(21, __pyx_n_s_model, __pyx_n_s_sentences, __pyx_n_s_alpha, __pyx_n_s_work, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_effective_samples, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_vlookup, __pyx_n_s_sent, __pyx_n_s_token, __pyx_n_s_word, __pyx_n_s_item, __pyx_n_s_running_training_loss_sample); if (unlikely(!__pyx_tuple__13)) __PYX_ERR(0, 500, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__13); - __Pyx_GIVEREF(__pyx_tuple__13); - __pyx_codeobj__14 = (PyObject*)__Pyx_PyCode_New(5, 0, 21, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__13, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_word2vec_inner_pyx, __pyx_n_s_train_batch_sg, 500, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__14)) __PYX_ERR(0, 500, __pyx_L1_error) + __pyx_tuple__10 = PyTuple_Pack(20, __pyx_n_s_model, __pyx_n_s_sentences, __pyx_n_s_alpha, __pyx_n_s_work, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_effective_samples, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_vlookup, __pyx_n_s_sent, __pyx_n_s_token, __pyx_n_s_word, __pyx_n_s_item); if (unlikely(!__pyx_tuple__10)) __PYX_ERR(0, 500, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__10); + __Pyx_GIVEREF(__pyx_tuple__10); + __pyx_codeobj__11 = (PyObject*)__Pyx_PyCode_New(5, 0, 20, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, 
__pyx_tuple__10, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_inner_pyx, __pyx_n_s_train_batch_sg, 500, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__11)) __PYX_ERR(0, 500, __pyx_L1_error) - /* "gensim/models/word2vec_inner.pyx":595 + /* "gensim/models/word2vec_inner.pyx":594 * * * def train_batch_cbow(model, sentences, alpha, _work, _neu1, compute_loss): # <<<<<<<<<<<<<< * """Update CBOW model by training on a batch of sentences. * */ - __pyx_tuple__15 = PyTuple_Pack(20, __pyx_n_s_model, __pyx_n_s_sentences, __pyx_n_s_alpha, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_vlookup, __pyx_n_s_sent, __pyx_n_s_token, __pyx_n_s_word, __pyx_n_s_item); if (unlikely(!__pyx_tuple__15)) __PYX_ERR(0, 595, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__15); - __Pyx_GIVEREF(__pyx_tuple__15); - __pyx_codeobj__16 = (PyObject*)__Pyx_PyCode_New(6, 0, 20, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__15, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_word2vec_inner_pyx, __pyx_n_s_train_batch_cbow, 595, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__16)) __PYX_ERR(0, 595, __pyx_L1_error) + __pyx_tuple__12 = PyTuple_Pack(20, __pyx_n_s_model, __pyx_n_s_sentences, __pyx_n_s_alpha, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_compute_loss, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_effective_words, __pyx_n_s_effective_sentences, __pyx_n_s_sent_idx, __pyx_n_s_idx_start, __pyx_n_s_idx_end, __pyx_n_s_vlookup, __pyx_n_s_sent, __pyx_n_s_token, __pyx_n_s_word, __pyx_n_s_item); if (unlikely(!__pyx_tuple__12)) __PYX_ERR(0, 594, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__12); + __Pyx_GIVEREF(__pyx_tuple__12); + __pyx_codeobj__13 = (PyObject*)__Pyx_PyCode_New(6, 0, 20, 0, CO_OPTIMIZED|CO_NEWLOCALS, 
__pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__12, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_inner_pyx, __pyx_n_s_train_batch_cbow, 594, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__13)) __PYX_ERR(0, 594, __pyx_L1_error) - /* "gensim/models/word2vec_inner.pyx":687 + /* "gensim/models/word2vec_inner.pyx":686 * * * def score_sentence_sg(model, sentence, _work): # <<<<<<<<<<<<<< * """Obtain likelihood score for a single sentence in a fitted skip-gram representation. * */ - __pyx_tuple__17 = PyTuple_Pack(12, __pyx_n_s_model, __pyx_n_s_sentence, __pyx_n_s_work, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_result, __pyx_n_s_sentence_len, __pyx_n_s_vlookup, __pyx_n_s_token, __pyx_n_s_word); if (unlikely(!__pyx_tuple__17)) __PYX_ERR(0, 687, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__17); - __Pyx_GIVEREF(__pyx_tuple__17); - __pyx_codeobj__18 = (PyObject*)__Pyx_PyCode_New(3, 0, 12, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__17, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_word2vec_inner_pyx, __pyx_n_s_score_sentence_sg, 687, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__18)) __PYX_ERR(0, 687, __pyx_L1_error) + __pyx_tuple__14 = PyTuple_Pack(12, __pyx_n_s_model, __pyx_n_s_sentence, __pyx_n_s_work, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_result, __pyx_n_s_sentence_len, __pyx_n_s_vlookup, __pyx_n_s_token, __pyx_n_s_word); if (unlikely(!__pyx_tuple__14)) __PYX_ERR(0, 686, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__14); + __Pyx_GIVEREF(__pyx_tuple__14); + __pyx_codeobj__15 = (PyObject*)__Pyx_PyCode_New(3, 0, 12, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__14, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_inner_pyx, __pyx_n_s_score_sentence_sg, 686, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__15)) __PYX_ERR(0, 686, __pyx_L1_error) - /* 
"gensim/models/word2vec_inner.pyx":780 + /* "gensim/models/word2vec_inner.pyx":779 * work[0] += f * * def score_sentence_cbow(model, sentence, _work, _neu1): # <<<<<<<<<<<<<< * """Obtain likelihood score for a single sentence in a fitted CBOW representation. * */ - __pyx_tuple__19 = PyTuple_Pack(13, __pyx_n_s_model, __pyx_n_s_sentence, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_result, __pyx_n_s_vlookup, __pyx_n_s_token, __pyx_n_s_word, __pyx_n_s_sentence_len); if (unlikely(!__pyx_tuple__19)) __PYX_ERR(0, 780, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__19); - __Pyx_GIVEREF(__pyx_tuple__19); - __pyx_codeobj__20 = (PyObject*)__Pyx_PyCode_New(4, 0, 13, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__19, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_word2vec_inner_pyx, __pyx_n_s_score_sentence_cbow, 780, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__20)) __PYX_ERR(0, 780, __pyx_L1_error) + __pyx_tuple__16 = PyTuple_Pack(13, __pyx_n_s_model, __pyx_n_s_sentence, __pyx_n_s_work, __pyx_n_s_neu1, __pyx_n_s_c, __pyx_n_s_i, __pyx_n_s_j, __pyx_n_s_k, __pyx_n_s_result, __pyx_n_s_vlookup, __pyx_n_s_token, __pyx_n_s_word, __pyx_n_s_sentence_len); if (unlikely(!__pyx_tuple__16)) __PYX_ERR(0, 779, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__16); + __Pyx_GIVEREF(__pyx_tuple__16); + __pyx_codeobj__17 = (PyObject*)__Pyx_PyCode_New(4, 0, 13, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__16, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_inner_pyx, __pyx_n_s_score_sentence_cbow, 779, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__17)) __PYX_ERR(0, 779, __pyx_L1_error) - /* "gensim/models/word2vec_inner.pyx":888 + /* "gensim/models/word2vec_inner.pyx":887 * * * def init(): # <<<<<<<<<<<<<< * """Precompute function `sigmoid(x) = 1 / (1 + exp(-x))`, for x values discretized into table EXP_TABLE. 
* Also calculate log(sigmoid(x)) into LOG_TABLE. */ - __pyx_tuple__21 = PyTuple_Pack(7, __pyx_n_s_i, __pyx_n_s_x, __pyx_n_s_y, __pyx_n_s_expected, __pyx_n_s_size, __pyx_n_s_d_res, __pyx_n_s_p_res); if (unlikely(!__pyx_tuple__21)) __PYX_ERR(0, 888, __pyx_L1_error) - __Pyx_GOTREF(__pyx_tuple__21); - __Pyx_GIVEREF(__pyx_tuple__21); - __pyx_codeobj__22 = (PyObject*)__Pyx_PyCode_New(0, 0, 7, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__21, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_word2vec_inner_pyx, __pyx_n_s_init, 888, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__22)) __PYX_ERR(0, 888, __pyx_L1_error) + __pyx_tuple__18 = PyTuple_Pack(7, __pyx_n_s_i, __pyx_n_s_x, __pyx_n_s_y, __pyx_n_s_expected, __pyx_n_s_size, __pyx_n_s_d_res, __pyx_n_s_p_res); if (unlikely(!__pyx_tuple__18)) __PYX_ERR(0, 887, __pyx_L1_error) + __Pyx_GOTREF(__pyx_tuple__18); + __Pyx_GIVEREF(__pyx_tuple__18); + __pyx_codeobj__19 = (PyObject*)__Pyx_PyCode_New(0, 0, 7, 0, CO_OPTIMIZED|CO_NEWLOCALS, __pyx_empty_bytes, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_tuple__18, __pyx_empty_tuple, __pyx_empty_tuple, __pyx_kp_s_gensim_models_word2vec_inner_pyx, __pyx_n_s_init, 887, __pyx_empty_bytes); if (unlikely(!__pyx_codeobj__19)) __PYX_ERR(0, 887, __pyx_L1_error) __Pyx_RefNannyFinishContext(); return 0; __pyx_L1_error:; @@ -11347,7 +11343,7 @@ static int __Pyx_InitCachedConstants(void) { return -1; } -static int __Pyx_InitGlobals(void) { +static CYTHON_SMALL_CODE int __Pyx_InitGlobals(void) { if (__Pyx_InitStrings(__pyx_string_tab) < 0) __PYX_ERR(0, 1, __pyx_L1_error); __pyx_int_0 = PyInt_FromLong(0); if (unlikely(!__pyx_int_0)) __PYX_ERR(0, 1, __pyx_L1_error) __pyx_int_1 = PyInt_FromLong(1); if (unlikely(!__pyx_int_1)) __PYX_ERR(0, 1, __pyx_L1_error) @@ -11359,13 +11355,13 @@ static int __Pyx_InitGlobals(void) { return -1; } -static int __Pyx_modinit_global_init_code(void); /*proto*/ -static int __Pyx_modinit_variable_export_code(void); 
/*proto*/ -static int __Pyx_modinit_function_export_code(void); /*proto*/ -static int __Pyx_modinit_type_init_code(void); /*proto*/ -static int __Pyx_modinit_type_import_code(void); /*proto*/ -static int __Pyx_modinit_variable_import_code(void); /*proto*/ -static int __Pyx_modinit_function_import_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_global_init_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_variable_export_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_function_export_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_type_init_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_type_import_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_variable_import_code(void); /*proto*/ +static CYTHON_SMALL_CODE int __Pyx_modinit_function_import_code(void); /*proto*/ static int __Pyx_modinit_global_init_code(void) { __Pyx_RefNannyDeclarations @@ -11427,23 +11423,37 @@ static int __Pyx_modinit_type_init_code(void) { static int __Pyx_modinit_type_import_code(void) { __Pyx_RefNannyDeclarations + PyObject *__pyx_t_1 = NULL; __Pyx_RefNannySetupContext("__Pyx_modinit_type_import_code", 0); /*--- Type import code ---*/ - __pyx_ptype_7cpython_4type_type = __Pyx_ImportType(__Pyx_BUILTIN_MODULE_NAME, "type", + __pyx_t_1 = PyImport_ImportModule(__Pyx_BUILTIN_MODULE_NAME); if (unlikely(!__pyx_t_1)) __PYX_ERR(2, 9, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_ptype_7cpython_4type_type = __Pyx_ImportType(__pyx_t_1, __Pyx_BUILTIN_MODULE_NAME, "type", #if defined(PYPY_VERSION_NUM) && PYPY_VERSION_NUM < 0x050B0000 sizeof(PyTypeObject), #else sizeof(PyHeapTypeObject), #endif - 0); if (unlikely(!__pyx_ptype_7cpython_4type_type)) __PYX_ERR(2, 9, __pyx_L1_error) - __pyx_ptype_5numpy_dtype = __Pyx_ImportType("numpy", "dtype", sizeof(PyArray_Descr), 0); if (unlikely(!__pyx_ptype_5numpy_dtype)) __PYX_ERR(1, 164, __pyx_L1_error) - __pyx_ptype_5numpy_flatiter = 
__Pyx_ImportType("numpy", "flatiter", sizeof(PyArrayIterObject), 0); if (unlikely(!__pyx_ptype_5numpy_flatiter)) __PYX_ERR(1, 186, __pyx_L1_error) - __pyx_ptype_5numpy_broadcast = __Pyx_ImportType("numpy", "broadcast", sizeof(PyArrayMultiIterObject), 0); if (unlikely(!__pyx_ptype_5numpy_broadcast)) __PYX_ERR(1, 190, __pyx_L1_error) - __pyx_ptype_5numpy_ndarray = __Pyx_ImportType("numpy", "ndarray", sizeof(PyArrayObject), 0); if (unlikely(!__pyx_ptype_5numpy_ndarray)) __PYX_ERR(1, 199, __pyx_L1_error) - __pyx_ptype_5numpy_ufunc = __Pyx_ImportType("numpy", "ufunc", sizeof(PyUFuncObject), 0); if (unlikely(!__pyx_ptype_5numpy_ufunc)) __PYX_ERR(1, 872, __pyx_L1_error) + __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_7cpython_4type_type) __PYX_ERR(2, 9, __pyx_L1_error) + __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; + __pyx_t_1 = PyImport_ImportModule("numpy"); if (unlikely(!__pyx_t_1)) __PYX_ERR(1, 206, __pyx_L1_error) + __Pyx_GOTREF(__pyx_t_1); + __pyx_ptype_5numpy_dtype = __Pyx_ImportType(__pyx_t_1, "numpy", "dtype", sizeof(PyArray_Descr), __Pyx_ImportType_CheckSize_Ignore); + if (!__pyx_ptype_5numpy_dtype) __PYX_ERR(1, 206, __pyx_L1_error) + __pyx_ptype_5numpy_flatiter = __Pyx_ImportType(__pyx_t_1, "numpy", "flatiter", sizeof(PyArrayIterObject), __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_5numpy_flatiter) __PYX_ERR(1, 229, __pyx_L1_error) + __pyx_ptype_5numpy_broadcast = __Pyx_ImportType(__pyx_t_1, "numpy", "broadcast", sizeof(PyArrayMultiIterObject), __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_5numpy_broadcast) __PYX_ERR(1, 233, __pyx_L1_error) + __pyx_ptype_5numpy_ndarray = __Pyx_ImportType(__pyx_t_1, "numpy", "ndarray", sizeof(PyArrayObject), __Pyx_ImportType_CheckSize_Ignore); + if (!__pyx_ptype_5numpy_ndarray) __PYX_ERR(1, 242, __pyx_L1_error) + __pyx_ptype_5numpy_ufunc = __Pyx_ImportType(__pyx_t_1, "numpy", "ufunc", sizeof(PyUFuncObject), __Pyx_ImportType_CheckSize_Warn); + if (!__pyx_ptype_5numpy_ufunc) __PYX_ERR(1, 918, __pyx_L1_error) + 
__Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; __Pyx_RefNannyFinishContext(); return 0; __pyx_L1_error:; + __Pyx_XDECREF(__pyx_t_1); __Pyx_RefNannyFinishContext(); return -1; } @@ -11478,15 +11488,6 @@ static int __Pyx_modinit_function_import_code(void) { #define __Pyx_PyMODINIT_FUNC PyMODINIT_FUNC #endif #endif -#ifndef CYTHON_SMALL_CODE -#if defined(__clang__) - #define CYTHON_SMALL_CODE -#elif defined(__GNUC__) && (!(defined(__cplusplus)) || (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ > 4))) - #define CYTHON_SMALL_CODE __attribute__((optimize("Os"))) -#else - #define CYTHON_SMALL_CODE -#endif -#endif #if PY_MAJOR_VERSION < 3 @@ -11499,11 +11500,36 @@ __Pyx_PyMODINIT_FUNC PyInit_word2vec_inner(void) { return PyModuleDef_Init(&__pyx_moduledef); } -static int __Pyx_copy_spec_to_module(PyObject *spec, PyObject *moddict, const char* from_name, const char* to_name) { +static CYTHON_SMALL_CODE int __Pyx_check_single_interpreter(void) { + #if PY_VERSION_HEX >= 0x030700A1 + static PY_INT64_T main_interpreter_id = -1; + PY_INT64_T current_id = PyInterpreterState_GetID(PyThreadState_Get()->interp); + if (main_interpreter_id == -1) { + main_interpreter_id = current_id; + return (unlikely(current_id == -1)) ? 
-1 : 0; + } else if (unlikely(main_interpreter_id != current_id)) + #else + static PyInterpreterState *main_interpreter = NULL; + PyInterpreterState *current_interpreter = PyThreadState_Get()->interp; + if (!main_interpreter) { + main_interpreter = current_interpreter; + } else if (unlikely(main_interpreter != current_interpreter)) + #endif + { + PyErr_SetString( + PyExc_ImportError, + "Interpreter change detected - this module can only be loaded into one interpreter per process."); + return -1; + } + return 0; +} +static CYTHON_SMALL_CODE int __Pyx_copy_spec_to_module(PyObject *spec, PyObject *moddict, const char* from_name, const char* to_name, int allow_none) { PyObject *value = PyObject_GetAttrString(spec, from_name); int result = 0; if (likely(value)) { - result = PyDict_SetItemString(moddict, to_name, value); + if (allow_none || value != Py_None) { + result = PyDict_SetItemString(moddict, to_name, value); + } Py_DECREF(value); } else if (PyErr_ExceptionMatches(PyExc_AttributeError)) { PyErr_Clear(); @@ -11512,8 +11538,10 @@ static int __Pyx_copy_spec_to_module(PyObject *spec, PyObject *moddict, const ch } return result; } -static PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *def) { +static CYTHON_SMALL_CODE PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *def) { PyObject *module = NULL, *moddict, *modname; + if (__Pyx_check_single_interpreter()) + return NULL; if (__pyx_m) return __Pyx_NewRef(__pyx_m); modname = PyObject_GetAttrString(spec, "name"); @@ -11523,10 +11551,10 @@ static PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *d if (unlikely(!module)) goto bad; moddict = PyModule_GetDict(module); if (unlikely(!moddict)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "loader", "__loader__") < 0)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "origin", "__file__") < 0)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "parent", 
"__package__") < 0)) goto bad; - if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "submodule_search_locations", "__path__") < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "loader", "__loader__", 1) < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "origin", "__file__", 1) < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "parent", "__package__", 1) < 0)) goto bad; + if (unlikely(__Pyx_copy_spec_to_module(spec, moddict, "submodule_search_locations", "__path__", 0) < 0)) goto bad; return module; bad: Py_XDECREF(module); @@ -11534,7 +11562,7 @@ static PyObject* __pyx_pymod_create(PyObject *spec, CYTHON_UNUSED PyModuleDef *d } -static int __pyx_pymod_exec_word2vec_inner(PyObject *__pyx_pyinit_module) +static CYTHON_SMALL_CODE int __pyx_pymod_exec_word2vec_inner(PyObject *__pyx_pyinit_module) #endif #endif { @@ -11549,7 +11577,11 @@ static int __pyx_pymod_exec_word2vec_inner(PyObject *__pyx_pyinit_module) PyObject *__pyx_t_9 = NULL; __Pyx_RefNannyDeclarations #if CYTHON_PEP489_MULTI_PHASE_INIT - if (__pyx_m && __pyx_m == __pyx_pyinit_module) return 0; + if (__pyx_m) { + if (__pyx_m == __pyx_pyinit_module) return 0; + PyErr_SetString(PyExc_RuntimeError, "Module 'word2vec_inner' has already been imported. 
Re-initialisation is not supported."); + return -1; + } #elif PY_MAJOR_VERSION >= 3 if (__pyx_m) return __Pyx_NewRef(__pyx_m); #endif @@ -11564,6 +11596,9 @@ if (!__Pyx_RefNanny) { #endif __Pyx_RefNannySetupContext("__Pyx_PyMODINIT_FUNC PyInit_word2vec_inner(void)", 0); if (__Pyx_check_binary_version() < 0) __PYX_ERR(0, 1, __pyx_L1_error) + #ifdef __Pxy_PyFrame_Initialize_Offsets + __Pxy_PyFrame_Initialize_Offsets(); + #endif __pyx_empty_tuple = PyTuple_New(0); if (unlikely(!__pyx_empty_tuple)) __PYX_ERR(0, 1, __pyx_L1_error) __pyx_empty_bytes = PyBytes_FromStringAndSize("", 0); if (unlikely(!__pyx_empty_bytes)) __PYX_ERR(0, 1, __pyx_L1_error) __pyx_empty_unicode = PyUnicode_FromStringAndSize("", 0); if (unlikely(!__pyx_empty_unicode)) __PYX_ERR(0, 1, __pyx_L1_error) @@ -11618,7 +11653,7 @@ if (!__Pyx_RefNanny) { if (__Pyx_init_sys_getdefaultencoding_params() < 0) __PYX_ERR(0, 1, __pyx_L1_error) #endif if (__pyx_module_is_main_gensim__models__word2vec_inner) { - if (PyObject_SetAttrString(__pyx_m, "__name__", __pyx_n_s_main) < 0) __PYX_ERR(0, 1, __pyx_L1_error) + if (PyObject_SetAttr(__pyx_m, __pyx_n_s_name, __pyx_n_s_main) < 0) __PYX_ERR(0, 1, __pyx_L1_error) } #if PY_MAJOR_VERSION >= 3 { @@ -11734,17 +11769,17 @@ if (!__Pyx_RefNanny) { */ __pyx_t_8 = PyList_New(1); if (unlikely(!__pyx_t_8)) __PYX_ERR(0, 27, __pyx_L4_except_error) __Pyx_GOTREF(__pyx_t_8); - __Pyx_INCREF(__pyx_n_s__12); - __Pyx_GIVEREF(__pyx_n_s__12); - PyList_SET_ITEM(__pyx_t_8, 0, __pyx_n_s__12); + __Pyx_INCREF(__pyx_n_s__9); + __Pyx_GIVEREF(__pyx_n_s__9); + PyList_SET_ITEM(__pyx_t_8, 0, __pyx_n_s__9); __pyx_t_9 = __Pyx_Import(__pyx_n_s_scipy_linalg_blas, __pyx_t_8, -1); if (unlikely(!__pyx_t_9)) __PYX_ERR(0, 27, __pyx_L4_except_error) __Pyx_GOTREF(__pyx_t_9); __Pyx_DECREF(__pyx_t_8); __pyx_t_8 = 0; if (PyDict_SetItem(__pyx_d, __pyx_n_s_fblas, __pyx_t_9) < 0) __PYX_ERR(0, 27, __pyx_L4_except_error) __Pyx_DECREF(__pyx_t_9); __pyx_t_9 = 0; - __Pyx_DECREF(__pyx_t_5); __pyx_t_5 = 0; - 
__Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; + __Pyx_XDECREF(__pyx_t_5); __pyx_t_5 = 0; + __Pyx_XDECREF(__pyx_t_1); __pyx_t_1 = 0; + __Pyx_XDECREF(__pyx_t_7); __pyx_t_7 = 0; goto __pyx_L3_exception_handled; } goto __pyx_L4_except_error; @@ -11777,7 +11812,7 @@ if (!__Pyx_RefNanny) { * * DEF MAX_SENTENCE_LEN = 10000 */ - __pyx_t_7 = __Pyx_GetModuleGlobalName(__pyx_n_s_np); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 29, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_7, __pyx_n_s_np); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 29, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); __pyx_t_1 = __Pyx_PyObject_GetAttrStr(__pyx_t_7, __pyx_n_s_float32); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 29, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); @@ -11792,7 +11827,7 @@ if (!__Pyx_RefNanny) { * cdef saxpy_ptr saxpy=PyCObject_AsVoidPtr(fblas.saxpy._cpointer) # y += alpha * x * cdef sdot_ptr sdot=PyCObject_AsVoidPtr(fblas.sdot._cpointer) # float = dot(x, y) */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 33, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 33, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_scopy); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 33, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); @@ -11810,7 +11845,7 @@ if (!__Pyx_RefNanny) { * cdef sdot_ptr sdot=PyCObject_AsVoidPtr(fblas.sdot._cpointer) # float = dot(x, y) * cdef dsdot_ptr dsdot=PyCObject_AsVoidPtr(fblas.sdot._cpointer) # double = dot(x, y) */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 34, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 34, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_saxpy); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 34, __pyx_L1_error) 
__Pyx_GOTREF(__pyx_t_7); @@ -11828,7 +11863,7 @@ if (!__Pyx_RefNanny) { * cdef dsdot_ptr dsdot=PyCObject_AsVoidPtr(fblas.sdot._cpointer) # double = dot(x, y) * cdef snrm2_ptr snrm2=PyCObject_AsVoidPtr(fblas.snrm2._cpointer) # sqrt(x^2) */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 35, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 35, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_sdot); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 35, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); @@ -11846,7 +11881,7 @@ if (!__Pyx_RefNanny) { * cdef snrm2_ptr snrm2=PyCObject_AsVoidPtr(fblas.snrm2._cpointer) # sqrt(x^2) * cdef sscal_ptr sscal=PyCObject_AsVoidPtr(fblas.sscal._cpointer) # x = alpha * x */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 36, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 36, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_sdot); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 36, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); @@ -11864,7 +11899,7 @@ if (!__Pyx_RefNanny) { * cdef sscal_ptr sscal=PyCObject_AsVoidPtr(fblas.sscal._cpointer) # x = alpha * x * */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 37, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 37, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_snrm2); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 37, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); @@ -11882,7 +11917,7 @@ if (!__Pyx_RefNanny) { * * DEF EXP_TABLE_SIZE = 1000 */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 38, 
__pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_fblas); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 38, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); __pyx_t_7 = __Pyx_PyObject_GetAttrStr(__pyx_t_1, __pyx_n_s_sscal); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 38, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); @@ -11923,74 +11958,74 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_train_batch_sg, __pyx_t_1) < 0) __PYX_ERR(0, 500, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":595 + /* "gensim/models/word2vec_inner.pyx":594 * * * def train_batch_cbow(model, sentences, alpha, _work, _neu1, compute_loss): # <<<<<<<<<<<<<< * """Update CBOW model by training on a batch of sentences. * */ - __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_3train_batch_cbow, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 595, __pyx_L1_error) + __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_3train_batch_cbow, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 594, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_train_batch_cbow, __pyx_t_1) < 0) __PYX_ERR(0, 595, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_train_batch_cbow, __pyx_t_1) < 0) __PYX_ERR(0, 594, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":687 + /* "gensim/models/word2vec_inner.pyx":686 * * * def score_sentence_sg(model, sentence, _work): # <<<<<<<<<<<<<< * """Obtain likelihood score for a single sentence in a fitted skip-gram representation. 
* */ - __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_5score_sentence_sg, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 687, __pyx_L1_error) + __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_5score_sentence_sg, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 686, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_score_sentence_sg, __pyx_t_1) < 0) __PYX_ERR(0, 687, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_score_sentence_sg, __pyx_t_1) < 0) __PYX_ERR(0, 686, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":780 + /* "gensim/models/word2vec_inner.pyx":779 * work[0] += f * * def score_sentence_cbow(model, sentence, _work, _neu1): # <<<<<<<<<<<<<< * """Obtain likelihood score for a single sentence in a fitted CBOW representation. * */ - __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_7score_sentence_cbow, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 780, __pyx_L1_error) + __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_7score_sentence_cbow, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 779, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_score_sentence_cbow, __pyx_t_1) < 0) __PYX_ERR(0, 780, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_score_sentence_cbow, __pyx_t_1) < 0) __PYX_ERR(0, 779, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":888 + /* "gensim/models/word2vec_inner.pyx":887 * * * def init(): # <<<<<<<<<<<<<< * """Precompute function `sigmoid(x) = 1 / (1 + exp(-x))`, for x values discretized into table EXP_TABLE. * Also calculate log(sigmoid(x)) into LOG_TABLE. 
*/ - __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_9init, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 888, __pyx_L1_error) + __pyx_t_1 = PyCFunction_NewEx(&__pyx_mdef_6gensim_6models_14word2vec_inner_9init, NULL, __pyx_n_s_gensim_models_word2vec_inner); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 887, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - if (PyDict_SetItem(__pyx_d, __pyx_n_s_init, __pyx_t_1) < 0) __PYX_ERR(0, 888, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_init, __pyx_t_1) < 0) __PYX_ERR(0, 887, __pyx_L1_error) __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - /* "gensim/models/word2vec_inner.pyx":935 + /* "gensim/models/word2vec_inner.pyx":934 * return 2 * * FAST_VERSION = init() # initialize the module # <<<<<<<<<<<<<< * MAX_WORDS_IN_BATCH = MAX_SENTENCE_LEN */ - __pyx_t_1 = __Pyx_GetModuleGlobalName(__pyx_n_s_init); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 935, __pyx_L1_error) + __Pyx_GetModuleGlobalName(__pyx_t_1, __pyx_n_s_init); if (unlikely(!__pyx_t_1)) __PYX_ERR(0, 934, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_1); - __pyx_t_7 = __Pyx_PyObject_CallNoArg(__pyx_t_1); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 935, __pyx_L1_error) + __pyx_t_7 = __Pyx_PyObject_CallNoArg(__pyx_t_1); if (unlikely(!__pyx_t_7)) __PYX_ERR(0, 934, __pyx_L1_error) __Pyx_GOTREF(__pyx_t_7); __Pyx_DECREF(__pyx_t_1); __pyx_t_1 = 0; - if (PyDict_SetItem(__pyx_d, __pyx_n_s_FAST_VERSION, __pyx_t_7) < 0) __PYX_ERR(0, 935, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, __pyx_n_s_FAST_VERSION, __pyx_t_7) < 0) __PYX_ERR(0, 934, __pyx_L1_error) __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - /* "gensim/models/word2vec_inner.pyx":936 + /* "gensim/models/word2vec_inner.pyx":935 * * FAST_VERSION = init() # initialize the module * MAX_WORDS_IN_BATCH = MAX_SENTENCE_LEN # <<<<<<<<<<<<<< */ - if (PyDict_SetItem(__pyx_d, __pyx_n_s_MAX_WORDS_IN_BATCH, __pyx_int_10000) < 0) __PYX_ERR(0, 936, __pyx_L1_error) + if (PyDict_SetItem(__pyx_d, 
__pyx_n_s_MAX_WORDS_IN_BATCH, __pyx_int_10000) < 0) __PYX_ERR(0, 935, __pyx_L1_error) /* "gensim/models/word2vec_inner.pyx":1 * #!/usr/bin/env cython # <<<<<<<<<<<<<< @@ -12002,7 +12037,7 @@ if (!__Pyx_RefNanny) { if (PyDict_SetItem(__pyx_d, __pyx_n_s_test, __pyx_t_7) < 0) __PYX_ERR(0, 1, __pyx_L1_error) __Pyx_DECREF(__pyx_t_7); __pyx_t_7 = 0; - /* "../../../../anaconda/lib/python2.7/site-packages/Cython/Includes/numpy/__init__.pxd":1008 + /* "../../envs/gensim/lib/python3.7/site-packages/Cython/Includes/numpy/__init__.pxd":1046 * raise ImportError("numpy.core.umath failed to import") * * cdef inline int import_ufunc() except -1: # <<<<<<<<<<<<<< @@ -12021,9 +12056,9 @@ if (!__Pyx_RefNanny) { __Pyx_XDECREF(__pyx_t_9); if (__pyx_m) { if (__pyx_d) { - __Pyx_AddTraceback("init gensim.models.word2vec_inner", 0, __pyx_lineno, __pyx_filename); + __Pyx_AddTraceback("init gensim.models.word2vec_inner", __pyx_clineno, __pyx_lineno, __pyx_filename); } - Py_DECREF(__pyx_m); __pyx_m = 0; + Py_CLEAR(__pyx_m); } else if (!PyErr_Occurred()) { PyErr_SetString(PyExc_ImportError, "init gensim.models.word2vec_inner"); } @@ -12044,9 +12079,9 @@ if (!__Pyx_RefNanny) { static __Pyx_RefNannyAPIStruct *__Pyx_RefNannyImportAPI(const char *modname) { PyObject *m = NULL, *p = NULL; void *r = NULL; - m = PyImport_ImportModule((char *)modname); + m = PyImport_ImportModule(modname); if (!m) goto end; - p = PyObject_GetAttrString(m, (char *)"RefNannyAPI"); + p = PyObject_GetAttrString(m, "RefNannyAPI"); if (!p) goto end; r = PyLong_AsVoidPtr(p); end: @@ -12084,6 +12119,73 @@ static PyObject *__Pyx_GetBuiltinName(PyObject *name) { return result; } +/* PyIntCompare */ +static CYTHON_INLINE PyObject* __Pyx_PyInt_NeObjC(PyObject *op1, PyObject *op2, CYTHON_UNUSED long intval, CYTHON_UNUSED long inplace) { + if (op1 == op2) { + Py_RETURN_FALSE; + } + #if PY_MAJOR_VERSION < 3 + if (likely(PyInt_CheckExact(op1))) { + const long b = intval; + long a = PyInt_AS_LONG(op1); + if (a != b) Py_RETURN_TRUE; 
else Py_RETURN_FALSE; + } + #endif + #if CYTHON_USE_PYLONG_INTERNALS + if (likely(PyLong_CheckExact(op1))) { + int unequal; + unsigned long uintval; + Py_ssize_t size = Py_SIZE(op1); + const digit* digits = ((PyLongObject*)op1)->ob_digit; + if (intval == 0) { + if (size != 0) Py_RETURN_TRUE; else Py_RETURN_FALSE; + } else if (intval < 0) { + if (size >= 0) + Py_RETURN_TRUE; + intval = -intval; + size = -size; + } else { + if (size <= 0) + Py_RETURN_TRUE; + } + uintval = (unsigned long) intval; +#if PyLong_SHIFT * 4 < SIZEOF_LONG*8 + if (uintval >> (PyLong_SHIFT * 4)) { + unequal = (size != 5) || (digits[0] != (uintval & (unsigned long) PyLong_MASK)) + | (digits[1] != ((uintval >> (1 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)) | (digits[2] != ((uintval >> (2 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)) | (digits[3] != ((uintval >> (3 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)) | (digits[4] != ((uintval >> (4 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)); + } else +#endif +#if PyLong_SHIFT * 3 < SIZEOF_LONG*8 + if (uintval >> (PyLong_SHIFT * 3)) { + unequal = (size != 4) || (digits[0] != (uintval & (unsigned long) PyLong_MASK)) + | (digits[1] != ((uintval >> (1 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)) | (digits[2] != ((uintval >> (2 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)) | (digits[3] != ((uintval >> (3 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)); + } else +#endif +#if PyLong_SHIFT * 2 < SIZEOF_LONG*8 + if (uintval >> (PyLong_SHIFT * 2)) { + unequal = (size != 3) || (digits[0] != (uintval & (unsigned long) PyLong_MASK)) + | (digits[1] != ((uintval >> (1 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)) | (digits[2] != ((uintval >> (2 * PyLong_SHIFT)) & (unsigned long) PyLong_MASK)); + } else +#endif +#if PyLong_SHIFT * 1 < SIZEOF_LONG*8 + if (uintval >> (PyLong_SHIFT * 1)) { + unequal = (size != 2) || (digits[0] != (uintval & (unsigned long) PyLong_MASK)) + | (digits[1] != ((uintval >> (1 * PyLong_SHIFT)) & (unsigned long) 
PyLong_MASK)); + } else +#endif + unequal = (size != 1) || (((unsigned long) digits[0]) != (uintval & (unsigned long) PyLong_MASK)); + if (unequal != 0) Py_RETURN_TRUE; else Py_RETURN_FALSE; + } + #endif + if (PyFloat_CheckExact(op1)) { + const long b = intval; + double a = PyFloat_AS_DOUBLE(op1); + if ((double)a != (double)b) Py_RETURN_TRUE; else Py_RETURN_FALSE; + } + return ( + PyObject_RichCompare(op1, op2, Py_NE)); +} + /* ExtTypeTest */ static CYTHON_INLINE int __Pyx_TypeTest(PyObject *obj, PyTypeObject *type) { if (unlikely(!type)) { @@ -12275,7 +12377,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_List_Fast(PyObject *o, Py_ssize_ if (wraparound & unlikely(i < 0)) { wrapped_i += PyList_GET_SIZE(o); } - if ((!boundscheck) || likely((0 <= wrapped_i) & (wrapped_i < PyList_GET_SIZE(o)))) { + if ((!boundscheck) || likely(__Pyx_is_valid_index(wrapped_i, PyList_GET_SIZE(o)))) { PyObject *r = PyList_GET_ITEM(o, wrapped_i); Py_INCREF(r); return r; @@ -12293,7 +12395,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Tuple_Fast(PyObject *o, Py_ssize if (wraparound & unlikely(i < 0)) { wrapped_i += PyTuple_GET_SIZE(o); } - if ((!boundscheck) || likely((0 <= wrapped_i) & (wrapped_i < PyTuple_GET_SIZE(o)))) { + if ((!boundscheck) || likely(__Pyx_is_valid_index(wrapped_i, PyTuple_GET_SIZE(o)))) { PyObject *r = PyTuple_GET_ITEM(o, wrapped_i); Py_INCREF(r); return r; @@ -12309,7 +12411,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Fast(PyObject *o, Py_ssize_t i, #if CYTHON_ASSUME_SAFE_MACROS && !CYTHON_AVOID_BORROWED_REFS && CYTHON_USE_TYPE_SLOTS if (is_list || PyList_CheckExact(o)) { Py_ssize_t n = ((!wraparound) | likely(i >= 0)) ? 
i : i + PyList_GET_SIZE(o); - if ((!boundscheck) || (likely((n >= 0) & (n < PyList_GET_SIZE(o))))) { + if ((!boundscheck) || (likely(__Pyx_is_valid_index(n, PyList_GET_SIZE(o))))) { PyObject *r = PyList_GET_ITEM(o, n); Py_INCREF(r); return r; @@ -12317,7 +12419,7 @@ static CYTHON_INLINE PyObject *__Pyx_GetItemInt_Fast(PyObject *o, Py_ssize_t i, } else if (PyTuple_CheckExact(o)) { Py_ssize_t n = ((!wraparound) | likely(i >= 0)) ? i : i + PyTuple_GET_SIZE(o); - if ((!boundscheck) || likely((n >= 0) & (n < PyTuple_GET_SIZE(o)))) { + if ((!boundscheck) || likely(__Pyx_is_valid_index(n, PyTuple_GET_SIZE(o)))) { PyObject *r = PyTuple_GET_ITEM(o, n); Py_INCREF(r); return r; @@ -12377,7 +12479,6 @@ static PyObject *__Pyx_PyObject_GetItem(PyObject *obj, PyObject* key) { /* PyFunctionFastCall */ #if CYTHON_FAST_PYCALL -#include "frameobject.h" static PyObject* __Pyx_PyFunction_FastCallNoKw(PyCodeObject *co, PyObject **args, Py_ssize_t na, PyObject *globals) { PyFrameObject *f; @@ -12395,7 +12496,7 @@ static PyObject* __Pyx_PyFunction_FastCallNoKw(PyCodeObject *co, PyObject **args if (f == NULL) { return NULL; } - fastlocals = f->f_localsplus; + fastlocals = __Pyx_PyFrame_GetLocalsplus(f); for (i = 0; i < na; i++) { Py_INCREF(*args); fastlocals[i] = *args++; @@ -12503,7 +12604,7 @@ static CYTHON_INLINE PyObject * __Pyx_PyCFunction_FastCall(PyObject *func_obj, P PyObject *self = PyCFunction_GET_SELF(func); int flags = PyCFunction_GET_FLAGS(func); assert(PyCFunction_Check(func)); - assert(METH_FASTCALL == (flags & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS))); + assert(METH_FASTCALL == (flags & ~(METH_CLASS | METH_STATIC | METH_COEXIST | METH_KEYWORDS | METH_STACKLESS))); assert(nargs >= 0); assert(nargs == 0 || args != NULL); /* _PyCFunction_FastCallDict() must not be called with an exception set, @@ -12511,9 +12612,9 @@ static CYTHON_INLINE PyObject * __Pyx_PyCFunction_FastCall(PyObject *func_obj, P caller loses its exception */ assert(!PyErr_Occurred()); if 
((PY_VERSION_HEX < 0x030700A0) || unlikely(flags & METH_KEYWORDS)) { - return (*((__Pyx_PyCFunctionFastWithKeywords)meth)) (self, args, nargs, NULL); + return (*((__Pyx_PyCFunctionFastWithKeywords)(void*)meth)) (self, args, nargs, NULL); } else { - return (*((__Pyx_PyCFunctionFast)meth)) (self, args, nargs); + return (*((__Pyx_PyCFunctionFast)(void*)meth)) (self, args, nargs); } } #endif @@ -12782,10 +12883,15 @@ static PyObject *__Pyx_PyDict_GetItem(PyObject *d, PyObject* key) { value = PyDict_GetItemWithError(d, key); if (unlikely(!value)) { if (!PyErr_Occurred()) { - PyObject* args = PyTuple_Pack(1, key); - if (likely(args)) - PyErr_SetObject(PyExc_KeyError, args); - Py_XDECREF(args); + if (unlikely(PyTuple_Check(key))) { + PyObject* args = PyTuple_Pack(1, key); + if (likely(args)) { + PyErr_SetObject(PyExc_KeyError, args); + Py_DECREF(args); + } + } else { + PyErr_SetObject(PyExc_KeyError, key); + } } return NULL; } @@ -12812,13 +12918,29 @@ static CYTHON_INLINE void __Pyx_RaiseNoneNotIterableError(void) { PyErr_SetString(PyExc_TypeError, "'NoneType' object is not iterable"); } +/* GetTopmostException */ +#if CYTHON_USE_EXC_INFO_STACK +static _PyErr_StackItem * +__Pyx_PyErr_GetTopmostException(PyThreadState *tstate) +{ + _PyErr_StackItem *exc_info = tstate->exc_info; + while ((exc_info->exc_type == NULL || exc_info->exc_type == Py_None) && + exc_info->previous_item != NULL) + { + exc_info = exc_info->previous_item; + } + return exc_info; +} +#endif + /* SaveResetException */ #if CYTHON_FAST_THREAD_STATE static CYTHON_INLINE void __Pyx__ExceptionSave(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) { - #if PY_VERSION_HEX >= 0x030700A3 - *type = tstate->exc_state.exc_type; - *value = tstate->exc_state.exc_value; - *tb = tstate->exc_state.exc_traceback; + #if CYTHON_USE_EXC_INFO_STACK + _PyErr_StackItem *exc_info = __Pyx_PyErr_GetTopmostException(tstate); + *type = exc_info->exc_type; + *value = exc_info->exc_value; + *tb = 
exc_info->exc_traceback; #else *type = tstate->exc_type; *value = tstate->exc_value; @@ -12830,13 +12952,14 @@ static CYTHON_INLINE void __Pyx__ExceptionSave(PyThreadState *tstate, PyObject * } static CYTHON_INLINE void __Pyx__ExceptionReset(PyThreadState *tstate, PyObject *type, PyObject *value, PyObject *tb) { PyObject *tmp_type, *tmp_value, *tmp_tb; - #if PY_VERSION_HEX >= 0x030700A3 - tmp_type = tstate->exc_state.exc_type; - tmp_value = tstate->exc_state.exc_value; - tmp_tb = tstate->exc_state.exc_traceback; - tstate->exc_state.exc_type = type; - tstate->exc_state.exc_value = value; - tstate->exc_state.exc_traceback = tb; + #if CYTHON_USE_EXC_INFO_STACK + _PyErr_StackItem *exc_info = tstate->exc_info; + tmp_type = exc_info->exc_type; + tmp_value = exc_info->exc_value; + tmp_tb = exc_info->exc_traceback; + exc_info->exc_type = type; + exc_info->exc_value = value; + exc_info->exc_traceback = tb; #else tmp_type = tstate->exc_type; tmp_value = tstate->exc_value; @@ -12878,10 +13001,11 @@ static CYTHON_INLINE int __Pyx_PyErr_ExceptionMatchesInState(PyThreadState* tsta /* GetException */ #if CYTHON_FAST_THREAD_STATE -static int __Pyx__GetException(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) { +static int __Pyx__GetException(PyThreadState *tstate, PyObject **type, PyObject **value, PyObject **tb) #else -static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) { +static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) #endif +{ PyObject *local_type, *local_value, *local_tb; #if CYTHON_FAST_THREAD_STATE PyObject *tmp_type, *tmp_value, *tmp_tb; @@ -12914,13 +13038,16 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) *value = local_value; *tb = local_tb; #if CYTHON_FAST_THREAD_STATE - #if PY_VERSION_HEX >= 0x030700A3 - tmp_type = tstate->exc_state.exc_type; - tmp_value = tstate->exc_state.exc_value; - tmp_tb = tstate->exc_state.exc_traceback; - 
tstate->exc_state.exc_type = local_type; - tstate->exc_state.exc_value = local_value; - tstate->exc_state.exc_traceback = local_tb; + #if CYTHON_USE_EXC_INFO_STACK + { + _PyErr_StackItem *exc_info = tstate->exc_info; + tmp_type = exc_info->exc_type; + tmp_value = exc_info->exc_value; + tmp_tb = exc_info->exc_traceback; + exc_info->exc_type = local_type; + exc_info->exc_value = local_value; + exc_info->exc_traceback = local_tb; + } #else tmp_type = tstate->exc_type; tmp_value = tstate->exc_value; @@ -12946,8 +13073,69 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) return -1; } +/* TypeImport */ +#ifndef __PYX_HAVE_RT_ImportType +#define __PYX_HAVE_RT_ImportType +static PyTypeObject *__Pyx_ImportType(PyObject *module, const char *module_name, const char *class_name, + size_t size, enum __Pyx_ImportType_CheckSize check_size) +{ + PyObject *result = 0; + char warning[200]; + Py_ssize_t basicsize; +#ifdef Py_LIMITED_API + PyObject *py_basicsize; +#endif + result = PyObject_GetAttrString(module, class_name); + if (!result) + goto bad; + if (!PyType_Check(result)) { + PyErr_Format(PyExc_TypeError, + "%.200s.%.200s is not a type object", + module_name, class_name); + goto bad; + } +#ifndef Py_LIMITED_API + basicsize = ((PyTypeObject *)result)->tp_basicsize; +#else + py_basicsize = PyObject_GetAttrString(result, "__basicsize__"); + if (!py_basicsize) + goto bad; + basicsize = PyLong_AsSsize_t(py_basicsize); + Py_DECREF(py_basicsize); + py_basicsize = 0; + if (basicsize == (Py_ssize_t)-1 && PyErr_Occurred()) + goto bad; +#endif + if ((size_t)basicsize < size) { + PyErr_Format(PyExc_ValueError, + "%.200s.%.200s size changed, may indicate binary incompatibility. 
" + "Expected %zd from C header, got %zd from PyObject", + module_name, class_name, size, basicsize); + goto bad; + } + if (check_size == __Pyx_ImportType_CheckSize_Error && (size_t)basicsize != size) { + PyErr_Format(PyExc_ValueError, + "%.200s.%.200s size changed, may indicate binary incompatibility. " + "Expected %zd from C header, got %zd from PyObject", + module_name, class_name, size, basicsize); + goto bad; + } + else if (check_size == __Pyx_ImportType_CheckSize_Warn && (size_t)basicsize > size) { + PyOS_snprintf(warning, sizeof(warning), + "%s.%s size changed, may indicate binary incompatibility. " + "Expected %zd from C header, got %zd from PyObject", + module_name, class_name, size, basicsize); + if (PyErr_WarnEx(NULL, warning, 0) < 0) goto bad; + } + return (PyTypeObject *)result; +bad: + Py_XDECREF(result); + return NULL; +} +#endif + /* Import */ - static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level) { +static PyObject *__Pyx_Import(PyObject *name, PyObject *from_list, int level) { PyObject *empty_list = 0; PyObject *module = 0; PyObject *global_dict = 0; @@ -12994,7 +13182,7 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) if (!py_level) goto bad; module = PyObject_CallFunctionObjArgs(py_import, - name, global_dict, empty_dict, list, py_level, NULL); + name, global_dict, empty_dict, list, py_level, (PyObject *)NULL); Py_DECREF(py_level); #else module = PyImport_ImportModuleLevelObject( @@ -13012,7 +13200,7 @@ static int __Pyx_GetException(PyObject **type, PyObject **value, PyObject **tb) } /* ImportFrom */ - static PyObject* __Pyx_ImportFrom(PyObject* module, PyObject* name) { +static PyObject* __Pyx_ImportFrom(PyObject* module, PyObject* name) { PyObject* value = __Pyx_PyObject_GetAttrStr(module, name); if (unlikely(!value) && PyErr_ExceptionMatches(PyExc_AttributeError)) { PyErr_Format(PyExc_ImportError, @@ -13026,34 +13214,42 @@ static int __Pyx_GetException(PyObject **type, PyObject 
**value, PyObject **tb) } /* GetModuleGlobalName */ - static CYTHON_INLINE PyObject *__Pyx_GetModuleGlobalName(PyObject *name) { +#if CYTHON_USE_DICT_VERSIONS +static PyObject *__Pyx__GetModuleGlobalName(PyObject *name, PY_UINT64_T *dict_version, PyObject **dict_cached_value) +#else +static CYTHON_INLINE PyObject *__Pyx__GetModuleGlobalName(PyObject *name) +#endif +{ PyObject *result; #if !CYTHON_AVOID_BORROWED_REFS #if CYTHON_COMPILING_IN_CPYTHON && PY_VERSION_HEX >= 0x030500A1 result = _PyDict_GetItem_KnownHash(__pyx_d, name, ((PyASCIIObject *) name)->hash); + __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) if (likely(result)) { - Py_INCREF(result); + return __Pyx_NewRef(result); } else if (unlikely(PyErr_Occurred())) { - result = NULL; - } else { + return NULL; + } #else result = PyDict_GetItem(__pyx_d, name); + __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) if (likely(result)) { - Py_INCREF(result); - } else { + return __Pyx_NewRef(result); + } #endif #else result = PyObject_GetItem(__pyx_d, name); - if (!result) { - PyErr_Clear(); -#endif - result = __Pyx_GetBuiltinName(name); + __PYX_UPDATE_DICT_CACHE(__pyx_d, result, *dict_cached_value, *dict_version) + if (likely(result)) { + return __Pyx_NewRef(result); } - return result; + PyErr_Clear(); +#endif + return __Pyx_GetBuiltinName(name); } /* PyObjectCallNoArg */ - #if CYTHON_COMPILING_IN_CPYTHON +#if CYTHON_COMPILING_IN_CPYTHON static CYTHON_INLINE PyObject* __Pyx_PyObject_CallNoArg(PyObject *func) { #if CYTHON_FAST_PYCALL if (PyFunction_Check(func)) { @@ -13061,10 +13257,11 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallNoArg(PyObject *func) { } #endif #ifdef __Pyx_CyFunction_USED - if (likely(PyCFunction_Check(func) || __Pyx_TypeCheck(func, __pyx_CyFunctionType))) { + if (likely(PyCFunction_Check(func) || __Pyx_CyFunction_Check(func))) #else - if (likely(PyCFunction_Check(func))) { + if (likely(PyCFunction_Check(func))) #endif + { if 
(likely(PyCFunction_GET_FLAGS(func) & METH_NOARGS)) { return __Pyx_PyObject_CallMethO(func, NULL); } @@ -13074,8 +13271,8 @@ static CYTHON_INLINE PyObject* __Pyx_PyObject_CallNoArg(PyObject *func) { #endif /* CLineInTraceback */ - #ifndef CYTHON_CLINE_IN_TRACEBACK -static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_line) { +#ifndef CYTHON_CLINE_IN_TRACEBACK +static int __Pyx_CLineForTraceback(PyThreadState *tstate, int c_line) { PyObject *use_cline; PyObject *ptype, *pvalue, *ptraceback; #if CYTHON_COMPILING_IN_CPYTHON @@ -13088,7 +13285,9 @@ static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_li #if CYTHON_COMPILING_IN_CPYTHON cython_runtime_dict = _PyObject_GetDictPtr(__pyx_cython_runtime); if (likely(cython_runtime_dict)) { - use_cline = __Pyx_PyDict_GetItemStr(*cython_runtime_dict, __pyx_n_s_cline_in_traceback); + __PYX_PY_DICT_LOOKUP_IF_MODIFIED( + use_cline, *cython_runtime_dict, + __Pyx_PyDict_GetItemStr(*cython_runtime_dict, __pyx_n_s_cline_in_traceback)) } else #endif { @@ -13105,7 +13304,7 @@ static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_li c_line = 0; PyObject_SetAttr(__pyx_cython_runtime, __pyx_n_s_cline_in_traceback, Py_False); } - else if (PyObject_Not(use_cline) != 0) { + else if (use_cline == Py_False || (use_cline != Py_True && PyObject_Not(use_cline) != 0)) { c_line = 0; } __Pyx_ErrRestoreInState(tstate, ptype, pvalue, ptraceback); @@ -13114,7 +13313,7 @@ static int __Pyx_CLineForTraceback(CYTHON_UNUSED PyThreadState *tstate, int c_li #endif /* CodeObjectCache */ - static int __pyx_bisect_code_objects(__Pyx_CodeObjectCacheEntry* entries, int count, int code_line) { +static int __pyx_bisect_code_objects(__Pyx_CodeObjectCacheEntry* entries, int count, int code_line) { int start = 0, mid = 0, end = count - 1; if (end >= 0 && code_line > entries[end].code_line) { return count; @@ -13194,7 +13393,7 @@ static void __pyx_insert_code_object(int code_line, PyCodeObject* 
code_object) { } /* AddTraceback */ - #include "compile.h" +#include "compile.h" #include "frameobject.h" #include "traceback.h" static PyCodeObject* __Pyx_CreateCodeObjectForTraceback( @@ -13279,8 +13478,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_int(int value) { - const int neg_one = (int) -1, const_zero = (int) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_int(int value) { + const int neg_one = (int) ((int) 0 - (int) 1), const_zero = (int) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(int) < sizeof(long)) { @@ -13310,7 +13509,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPyVerify */ - #define __PYX_VERIFY_RETURN_INT(target_type, func_type, func_value)\ +#define __PYX_VERIFY_RETURN_INT(target_type, func_type, func_value)\ __PYX__VERIFY_RETURN_INT(target_type, func_type, func_value, 0) #define __PYX_VERIFY_RETURN_INT_EXC(target_type, func_type, func_value)\ __PYX__VERIFY_RETURN_INT(target_type, func_type, func_value, 1) @@ -13332,7 +13531,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* None */ - static CYTHON_INLINE long __Pyx_pow_long(long b, long e) { +static CYTHON_INLINE long __Pyx_pow_long(long b, long e) { long t = b; switch (e) { case 3: @@ -13359,8 +13558,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { - const long neg_one = (long) -1, const_zero = (long) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_long(long value) { + const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(long) < sizeof(long)) { @@ -13390,8 +13589,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntToPy */ - static CYTHON_INLINE PyObject* 
__Pyx_PyInt_From_unsigned_PY_LONG_LONG(unsigned PY_LONG_LONG value) { - const unsigned PY_LONG_LONG neg_one = (unsigned PY_LONG_LONG) -1, const_zero = (unsigned PY_LONG_LONG) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_unsigned_PY_LONG_LONG(unsigned PY_LONG_LONG value) { + const unsigned PY_LONG_LONG neg_one = (unsigned PY_LONG_LONG) ((unsigned PY_LONG_LONG) 0 - (unsigned PY_LONG_LONG) 1), const_zero = (unsigned PY_LONG_LONG) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(unsigned PY_LONG_LONG) < sizeof(long)) { @@ -13421,7 +13620,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* Declarations */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #ifdef __cplusplus static CYTHON_INLINE __pyx_t_float_complex __pyx_t_float_complex_from_parts(float x, float y) { return ::std::complex< float >(x, y); @@ -13441,7 +13640,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* Arithmetic */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #else static CYTHON_INLINE int __Pyx_c_eq_float(__pyx_t_float_complex a, __pyx_t_float_complex b) { return (a.real == b.real) && (a.imag == b.imag); @@ -13576,7 +13775,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* Declarations */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #ifdef __cplusplus static CYTHON_INLINE __pyx_t_double_complex __pyx_t_double_complex_from_parts(double x, double y) { return ::std::complex< double >(x, y); @@ -13596,7 +13795,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* Arithmetic */ - #if CYTHON_CCOMPLEX +#if CYTHON_CCOMPLEX #else static CYTHON_INLINE int __Pyx_c_eq_double(__pyx_t_double_complex a, __pyx_t_double_complex b) { return (a.real == b.real) && (a.imag == b.imag); @@ -13731,8 +13930,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, #endif /* CIntToPy */ - static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES value) { - 
const enum NPY_TYPES neg_one = (enum NPY_TYPES) -1, const_zero = (enum NPY_TYPES) 0; +static CYTHON_INLINE PyObject* __Pyx_PyInt_From_enum__NPY_TYPES(enum NPY_TYPES value) { + const enum NPY_TYPES neg_one = (enum NPY_TYPES) ((enum NPY_TYPES) 0 - (enum NPY_TYPES) 1), const_zero = (enum NPY_TYPES) 0; const int is_unsigned = neg_one > const_zero; if (is_unsigned) { if (sizeof(enum NPY_TYPES) < sizeof(long)) { @@ -13762,8 +13961,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE PY_LONG_LONG __Pyx_PyInt_As_PY_LONG_LONG(PyObject *x) { - const PY_LONG_LONG neg_one = (PY_LONG_LONG) -1, const_zero = (PY_LONG_LONG) 0; +static CYTHON_INLINE PY_LONG_LONG __Pyx_PyInt_As_PY_LONG_LONG(PyObject *x) { + const PY_LONG_LONG neg_one = (PY_LONG_LONG) ((PY_LONG_LONG) 0 - (PY_LONG_LONG) 1), const_zero = (PY_LONG_LONG) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -13951,8 +14150,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE int __Pyx_PyInt_As_int(PyObject *x) { - const int neg_one = (int) -1, const_zero = (int) 0; +static CYTHON_INLINE int __Pyx_PyInt_As_int(PyObject *x) { + const int neg_one = (int) ((int) 0 - (int) 1), const_zero = (int) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -14140,8 +14339,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE unsigned PY_LONG_LONG __Pyx_PyInt_As_unsigned_PY_LONG_LONG(PyObject *x) { - const unsigned PY_LONG_LONG neg_one = (unsigned PY_LONG_LONG) -1, const_zero = (unsigned PY_LONG_LONG) 0; +static CYTHON_INLINE unsigned PY_LONG_LONG __Pyx_PyInt_As_unsigned_PY_LONG_LONG(PyObject *x) { + const unsigned PY_LONG_LONG neg_one = (unsigned PY_LONG_LONG) ((unsigned PY_LONG_LONG) 0 - (unsigned PY_LONG_LONG) 1), const_zero = (unsigned PY_LONG_LONG) 0; 
const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -14329,8 +14528,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE npy_uint32 __Pyx_PyInt_As_npy_uint32(PyObject *x) { - const npy_uint32 neg_one = (npy_uint32) -1, const_zero = (npy_uint32) 0; +static CYTHON_INLINE npy_uint32 __Pyx_PyInt_As_npy_uint32(PyObject *x) { + const npy_uint32 neg_one = (npy_uint32) ((npy_uint32) 0 - (npy_uint32) 1), const_zero = (npy_uint32) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -14518,8 +14717,8 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* CIntFromPy */ - static CYTHON_INLINE long __Pyx_PyInt_As_long(PyObject *x) { - const long neg_one = (long) -1, const_zero = (long) 0; +static CYTHON_INLINE long __Pyx_PyInt_As_long(PyObject *x) { + const long neg_one = (long) ((long) 0 - (long) 1), const_zero = (long) 0; const int is_unsigned = neg_one > const_zero; #if PY_MAJOR_VERSION < 3 if (likely(PyInt_Check(x))) { @@ -14707,7 +14906,7 @@ static void __Pyx_AddTraceback(const char *funcname, int c_line, } /* FastTypeChecks */ - #if CYTHON_COMPILING_IN_CPYTHON +#if CYTHON_COMPILING_IN_CPYTHON static int __Pyx_InBases(PyTypeObject *a, PyTypeObject *b) { while (a) { a = a->tp_base; @@ -14807,7 +15006,7 @@ static CYTHON_INLINE int __Pyx_PyErr_GivenExceptionMatches2(PyObject *err, PyObj #endif /* CheckBinaryVersion */ - static int __Pyx_check_binary_version(void) { +static int __Pyx_check_binary_version(void) { char ctversion[4], rtversion[4]; PyOS_snprintf(ctversion, 4, "%d.%d", PY_MAJOR_VERSION, PY_MINOR_VERSION); PyOS_snprintf(rtversion, 4, "%s", Py_GetVersion()); @@ -14823,7 +15022,7 @@ static CYTHON_INLINE int __Pyx_PyErr_GivenExceptionMatches2(PyObject *err, PyObj } /* VoidPtrExport */ - static int __Pyx_ExportVoidPtr(PyObject *name, void *p, const char *sig) { +static int 
__Pyx_ExportVoidPtr(PyObject *name, void *p, const char *sig) { PyObject *d; PyObject *cobj = 0; d = PyDict_GetItem(__pyx_d, __pyx_n_s_pyx_capi); @@ -14854,7 +15053,7 @@ static CYTHON_INLINE int __Pyx_PyErr_GivenExceptionMatches2(PyObject *err, PyObj } /* FunctionExport */ - static int __Pyx_ExportFunction(const char *name, void (*f)(void), const char *sig) { +static int __Pyx_ExportFunction(const char *name, void (*f)(void), const char *sig) { PyObject *d = 0; PyObject *cobj = 0; union { @@ -14890,91 +15089,8 @@ static CYTHON_INLINE int __Pyx_PyErr_GivenExceptionMatches2(PyObject *err, PyObj return -1; } -/* ModuleImport */ - #ifndef __PYX_HAVE_RT_ImportModule -#define __PYX_HAVE_RT_ImportModule -static PyObject *__Pyx_ImportModule(const char *name) { - PyObject *py_name = 0; - PyObject *py_module = 0; - py_name = __Pyx_PyIdentifier_FromString(name); - if (!py_name) - goto bad; - py_module = PyImport_Import(py_name); - Py_DECREF(py_name); - return py_module; -bad: - Py_XDECREF(py_name); - return 0; -} -#endif - -/* TypeImport */ - #ifndef __PYX_HAVE_RT_ImportType -#define __PYX_HAVE_RT_ImportType -static PyTypeObject *__Pyx_ImportType(const char *module_name, const char *class_name, - size_t size, int strict) -{ - PyObject *py_module = 0; - PyObject *result = 0; - PyObject *py_name = 0; - char warning[200]; - Py_ssize_t basicsize; -#ifdef Py_LIMITED_API - PyObject *py_basicsize; -#endif - py_module = __Pyx_ImportModule(module_name); - if (!py_module) - goto bad; - py_name = __Pyx_PyIdentifier_FromString(class_name); - if (!py_name) - goto bad; - result = PyObject_GetAttr(py_module, py_name); - Py_DECREF(py_name); - py_name = 0; - Py_DECREF(py_module); - py_module = 0; - if (!result) - goto bad; - if (!PyType_Check(result)) { - PyErr_Format(PyExc_TypeError, - "%.200s.%.200s is not a type object", - module_name, class_name); - goto bad; - } -#ifndef Py_LIMITED_API - basicsize = ((PyTypeObject *)result)->tp_basicsize; -#else - py_basicsize = 
PyObject_GetAttrString(result, "__basicsize__"); - if (!py_basicsize) - goto bad; - basicsize = PyLong_AsSsize_t(py_basicsize); - Py_DECREF(py_basicsize); - py_basicsize = 0; - if (basicsize == (Py_ssize_t)-1 && PyErr_Occurred()) - goto bad; -#endif - if (!strict && (size_t)basicsize > size) { - PyOS_snprintf(warning, sizeof(warning), - "%s.%s size changed, may indicate binary incompatibility. Expected %zd, got %zd", - module_name, class_name, basicsize, size); - if (PyErr_WarnEx(NULL, warning, 0) < 0) goto bad; - } - else if ((size_t)basicsize != size) { - PyErr_Format(PyExc_ValueError, - "%.200s.%.200s has the wrong size, try recompiling. Expected %zd, got %zd", - module_name, class_name, basicsize, size); - goto bad; - } - return (PyTypeObject *)result; -bad: - Py_XDECREF(py_module); - Py_XDECREF(result); - return NULL; -} -#endif - /* InitStrings */ - static int __Pyx_InitStrings(__Pyx_StringTabEntry *t) { +static int __Pyx_InitStrings(__Pyx_StringTabEntry *t) { while (t->p) { #if PY_MAJOR_VERSION < 3 if (t->is_unicode) { @@ -15083,6 +15199,13 @@ static CYTHON_INLINE int __Pyx_PyObject_IsTrue(PyObject* x) { if (is_true | (x == Py_False) | (x == Py_None)) return is_true; else return PyObject_IsTrue(x); } +static CYTHON_INLINE int __Pyx_PyObject_IsTrueAndDecref(PyObject* x) { + int retval; + if (unlikely(!x)) return -1; + retval = __Pyx_PyObject_IsTrue(x); + Py_DECREF(x); + return retval; +} static PyObject* __Pyx_PyNumber_IntOrLongWrongResultType(PyObject* result, const char* type_name) { #if PY_MAJOR_VERSION >= 3 if (PyLong_Check(result)) { @@ -15160,7 +15283,7 @@ static CYTHON_INLINE Py_ssize_t __Pyx_PyIndex_AsSsize_t(PyObject* b) { if (sizeof(Py_ssize_t) >= sizeof(long)) return PyInt_AS_LONG(b); else - return PyInt_AsSsize_t(x); + return PyInt_AsSsize_t(b); } #endif if (likely(PyLong_CheckExact(b))) { diff --git a/gensim/similarities/__init__.py b/gensim/similarities/__init__.py index 1becd76831..3c670ba95b 100644 --- a/gensim/similarities/__init__.py +++ 
b/gensim/similarities/__init__.py @@ -3,6 +3,15 @@ """ # bring classes directly into package namespace, to save some typing -from .docsim import Similarity, MatrixSimilarity, SparseMatrixSimilarity, SoftCosineSimilarity, WmdSimilarity # noqa:F401 -from .termsim import TermSimilarityIndex, UniformTermSimilarityIndex, SparseTermSimilarityMatrix # noqa:F401 + +from .docsim import ( # noqa:F401 + Similarity, + MatrixSimilarity, + SparseMatrixSimilarity, + SoftCosineSimilarity, + WmdSimilarity) +from .termsim import ( # noqa:F401 + TermSimilarityIndex, + UniformTermSimilarityIndex, + SparseTermSimilarityMatrix) from .levenshtein import LevenshteinSimilarityIndex # noqa:F401 diff --git a/gensim/similarities/docsim.py b/gensim/similarities/docsim.py index bb7b4f402b..10e061310a 100755 --- a/gensim/similarities/docsim.py +++ b/gensim/similarities/docsim.py @@ -866,13 +866,13 @@ class SoftCosineSimilarity(interfaces.SimilarityABC): >>> from gensim.test.utils import common_texts >>> from gensim.corpora import Dictionary >>> from gensim.models import Word2Vec, WordEmbeddingSimilarityIndex - >>> from gensim.similarities import SoftCosineSimilarity, TermSimilarityMatrix + >>> from gensim.similarities import SoftCosineSimilarity, SparseTermSimilarityMatrix >>> >>> model = Word2Vec(common_texts, size=20, min_count=1) # train word-vectors - >>> termsim_index = WordEmbeddingSimilarityIndex(model) + >>> termsim_index = WordEmbeddingSimilarityIndex(model.wv) >>> dictionary = Dictionary(common_texts) >>> bow_corpus = [dictionary.doc2bow(document) for document in common_texts] - >>> similarity_matrix = TermSimilarityMatrix(termsim_index, dictionary) # construct similarity matrix + >>> similarity_matrix = SparseTermSimilarityMatrix(termsim_index, dictionary) # construct similarity matrix >>> docsim_index = SoftCosineSimilarity(bow_corpus, similarity_matrix, num_best=10) >>> >>> query = 'graph trees computer'.split() # make a query diff --git a/gensim/similarities/termsim.py 
b/gensim/similarities/termsim.py index 6a0b6d12b5..167b73b241 100644 --- a/gensim/similarities/termsim.py +++ b/gensim/similarities/termsim.py @@ -128,13 +128,13 @@ class SparseTermSimilarityMatrix(SaveLoad): >>> from gensim.test.utils import common_texts >>> from gensim.corpora import Dictionary >>> from gensim.models import Word2Vec, WordEmbeddingSimilarityIndex - >>> from gensim.similarities import SoftCosineSimilarity, TermSimilarityMatrix + >>> from gensim.similarities import SoftCosineSimilarity, SparseTermSimilarityMatrix >>> >>> model = Word2Vec(common_texts, size=20, min_count=1) # train word-vectors - >>> termsim_index = WordEmbeddingSimilarityIndex(model) + >>> termsim_index = WordEmbeddingSimilarityIndex(model.wv) >>> dictionary = Dictionary(common_texts) >>> bow_corpus = [dictionary.doc2bow(document) for document in common_texts] - >>> similarity_matrix = TermSimilarityMatrix(termsim_index, dictionary) # construct similarity matrix + >>> similarity_matrix = SparseTermSimilarityMatrix(termsim_index, dictionary) # construct similarity matrix >>> docsim_index = SoftCosineSimilarity(bow_corpus, similarity_matrix, num_best=10) >>> >>> query = 'graph trees computer'.split() # make a query diff --git a/gensim/test/test_data/fb-ngrams.txt b/gensim/test/test_data/fb-ngrams.txt new file mode 100644 index 0000000000..3296d85c6a --- /dev/null +++ b/gensim/test/test_data/fb-ngrams.txt @@ -0,0 +1,89 @@ + +test +test 0 0 0 0 0 + -0.058167 0.084801 -0.10452 0.085963 -0.14475 +tes 0.066033 0.011132 0.13224 0.19839 -0.037827 +test -0.12628 0.053912 0.051677 0.24844 0.083743 +test> -0.016497 0.1322 0.21391 0.20869 -0.044566 +est -0.12915 -0.02457 0.10145 0.23414 0.17121 +est> -0.1776 0.19906 -0.15572 0.16449 -0.12887 +st> -0.13712 0.028013 -0.041927 0.11244 0.12261 + + +at the +at the 0 0 0 0 0 + 0.17667 0.026172 -0.15457 0.081664 -0.1315 + th 0.1095 0.077397 0.052745 -0.043956 0.033436 + the -0.15504 0.11166 -0.16434 0.089162 -0.16199 + the> 0.097803 -0.054657 -0.028828 
0.21607 0.11286 +the -0.046122 -0.071463 0.20759 0.25732 0.23174 +the> 0.04535 0.15192 -0.0021161 0.014343 0.12982 +he> -0.046122 -0.071463 0.20759 0.25732 0.23174 + + +atnthe +atnthe 0 0 0 0 0 + -0.065392 -0.085291 0.088378 0.024628 0.12715 +nth 0.067156 -0.068108 0.16394 0.18192 0.18902 +nthe 0.13526 -0.023216 -0.10788 0.24512 -0.022174 +nthe> -0.20296 -0.11805 0.20277 0.063027 -0.041727 +the -0.046122 -0.071463 0.20759 0.25732 0.23174 +the> 0.04535 0.15192 -0.0021161 0.014343 0.12982 +he> -0.046122 -0.071463 0.20759 0.25732 0.23174 + + +тест +тест 0 0 0 0 0 +<те -0.17079 -0.029842 0.10298 -0.12632 -0.14488 +<тес -0.026151 0.13071 0.20833 0.17143 0.040533 +<тест 0.17667 0.026172 -0.15457 0.081664 -0.1315 +<тест> -0.065392 -0.085291 0.088378 0.024628 0.12715 +тес -0.08172 -0.13699 0.14081 -0.036949 -0.037403 +тест -0.11209 0.068818 -0.137 -0.088165 0.13144 +тест> -0.20296 -0.11805 0.20277 0.063027 -0.041727 +ест -0.17079 -0.029842 0.10298 -0.12632 -0.14488 +ест> 0.16922 -0.1162 0.1462 0.1085 0.02952 +ст> -0.17261 0.086891 0.21772 0.10036 0.19114 + + +テスト +テスト 0 0 0 0 0 +<テス 0.066033 0.011132 0.13224 0.19839 -0.037827 +<テスト -0.12915 -0.02457 0.10145 0.23414 0.17121 +<テスト> -0.10241 0.0090735 0.097437 0.055768 0.03622 +テスト 0.048443 0.15183 -0.058779 -0.1095 0.10566 +テスト> -0.12628 0.053912 0.051677 0.24844 0.083743 +スト> 0.12972 0.18282 -0.18266 -0.072433 0.19318 + + +試し +試し 0 0 0 0 0 +<試し 0.1095 0.077397 0.052745 -0.043956 0.033436 +<試し> 0.11952 0.15093 -0.075759 0.18327 0.12471 +試し> -0.14656 0.072651 -0.16777 0.20026 0.21199 + diff --git a/gensim/test/test_data/ft_kv_3.6.0.model.gz b/gensim/test/test_data/ft_kv_3.6.0.model.gz new file mode 100644 index 0000000000..55fd042b54 Binary files /dev/null and b/gensim/test/test_data/ft_kv_3.6.0.model.gz differ diff --git a/gensim/test/test_data/pretrained.vec b/gensim/test/test_data/pretrained.vec new file mode 100644 index 0000000000..d38bd8529b --- /dev/null +++ b/gensim/test/test_data/pretrained.vec @@ -0,0 +1,2 @@ +3 5 
+dummy 0.069324 0.18155 0.080453 -0.1799 0.032043 diff --git a/gensim/test/test_data/toy-model-pretrained.bin b/gensim/test/test_data/toy-model-pretrained.bin new file mode 100644 index 0000000000..5f7dabd622 Binary files /dev/null and b/gensim/test/test_data/toy-model-pretrained.bin differ diff --git a/gensim/test/test_fasttext.py b/gensim/test/test_fasttext.py index 67b035549b..4a1056a109 100644 --- a/gensim/test/test_fasttext.py +++ b/gensim/test/test_fasttext.py @@ -2,6 +2,7 @@ # -*- coding: utf-8 -*- from __future__ import division +import io import logging import unittest import os @@ -19,6 +20,8 @@ from gensim.models.wrappers.fasttext import FastText as FT_wrapper from gensim.models.keyedvectors import Word2VecKeyedVectors from gensim.test.utils import datapath, get_tmpfile, temporary_file, common_texts as sentences +import gensim.models._fasttext_bin + try: from pyemd import emd # noqa:F401 @@ -59,6 +62,21 @@ def setUp(self): self.test_model = FT_gensim.load_fasttext_format(self.test_model_file) self.test_new_model_file = datapath('lee_fasttext_new') + def test_native_partial_model(self): + """Can we skip loading the NN and still get a working model?""" + model = FT_gensim.load_fasttext_format(self.test_model_file, full_model=False) + + # + # Training continuation should be impossible + # + self.assertIsNone(model.trainables.syn1neg) + self.assertRaises(ValueError, model.train, sentences, + total_examples=model.corpus_count, epochs=model.epochs) + + model.wv['green'] + model.wv['foobar'] + model.wv['thisworddoesnotexist'] + def test_training(self): model = FT_gensim(size=10, min_count=1, hs=1, negative=0, seed=42, workers=1) model.build_vocab(sentences) @@ -1099,6 +1117,29 @@ def test_save_load_native(self): model.save(model_name) + def test_load_native_pretrained(self): + model = FT_gensim.load_fasttext_format(datapath('toy-model-pretrained.bin')) + actual = model['monarchist'] + expected = np.array([0.76222, 1.0669, 0.7055, -0.090969, -0.53508]) + 
self.assertTrue(np.allclose(expected, actual, atol=10e-4)) + + +def _train_model_with_pretrained_vectors(): + """Generate toy-model-pretrained.bin for use in test_load_native_pretrained. + + Requires https://github.com/facebookresearch/fastText/tree/master/python to be installed. + + """ + import fastText + + training_text = datapath('toy-data.txt') + pretrained_file = datapath('pretrained.vec') + model = fastText.train_unsupervised( + training_text, + bucket=100, model='skipgram', dim=5, pretrainedVectors=pretrained_file + ) + model.save_model(datapath('toy-model-pretrained.bin')) + class HashCompatibilityTest(unittest.TestCase): def test_compatibility_true(self): @@ -1171,6 +1212,69 @@ def test_out_of_vocab(self): self.assertRaises(KeyError, model.wv.word_vec, 'streamtrain') +class UnicodeVocabTest(unittest.TestCase): + def test_ascii(self): + buf = io.BytesIO() + buf.name = 'dummy name to keep fasttext happy' + buf.write(struct.pack('@3i', 2, -1, -1)) # vocab_size, nwords, nlabels + buf.write(struct.pack('@1q', -1)) + buf.write(b'hello') + buf.write(b'\x00') + buf.write(struct.pack('@qb', 1, -1)) + buf.write(b'world') + buf.write(b'\x00') + buf.write(struct.pack('@qb', 2, -1)) + buf.seek(0) + + raw_vocab, vocab_size, nlabels = gensim.models._fasttext_bin._load_vocab(buf, False) + expected = {'hello': 1, 'world': 2} + self.assertEqual(expected, dict(raw_vocab)) + + self.assertEqual(vocab_size, 2) + self.assertEqual(nlabels, -1) + + def test_bad_unicode(self): + buf = io.BytesIO() + buf.name = 'dummy name to keep fasttext happy' + buf.write(struct.pack('@3i', 2, -1, -1)) # vocab_size, nwords, nlabels + buf.write(struct.pack('@1q', -1)) + # + # encountered in https://github.com/RaRe-Technologies/gensim/issues/2378 + # The model downloaded from + # https://s3-us-west-1.amazonaws.com/fasttext-vectors/wiki-news-300d-1M-subword.bin.zip + # suffers from bad characters in a few of the vocab terms.
The native + # fastText utility loads the model fine, but we trip up over the bad + # characters. + # + buf.write( + b'\xe8\x8b\xb1\xe8\xaa\x9e\xe7\x89\x88\xe3\x82\xa6\xe3\x82\xa3\xe3' + b'\x82\xad\xe3\x83\x9a\xe3\x83\x87\xe3\x82\xa3\xe3\x82\xa2\xe3\x81' + b'\xb8\xe3\x81\xae\xe6\x8a\x95\xe7\xa8\xbf\xe3\x81\xaf\xe3\x81\x84' + b'\xe3\x81\xa4\xe3\x81\xa7\xe3\x82\x82\xe6' + ) + buf.write(b'\x00') + buf.write(struct.pack('@qb', 1, -1)) + buf.write( + b'\xd0\xb0\xd0\xb4\xd0\xbc\xd0\xb8\xd0\xbd\xd0\xb8\xd1\x81\xd1\x82' + b'\xd1\x80\xd0\xb0\xd1\x82\xd0\xb8\xd0\xb2\xd0\xbd\xd0\xbe-\xd1\x82' + b'\xd0\xb5\xd1\x80\xd1\x80\xd0\xb8\xd1\x82\xd0\xbe\xd1\x80\xd0\xb8' + b'\xd0\xb0\xd0\xbb\xd1\x8c\xd0\xbd\xd1' + ) + buf.write(b'\x00') + buf.write(struct.pack('@qb', 2, -1)) + buf.seek(0) + + raw_vocab, vocab_size, nlabels = gensim.models._fasttext_bin._load_vocab(buf, False) + expected = { + u'英語版ウィキペディアへの投稿はいつでも': 1, + u'административно-территориальн': 2, + } + self.assertEqual(expected, dict(raw_vocab)) + + self.assertEqual(vocab_size, 2) + self.assertEqual(nlabels, -1) + + if __name__ == '__main__': logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s', level=logging.DEBUG) unittest.main() diff --git a/gensim/test/test_keyedvectors.py b/gensim/test/test_keyedvectors.py index 2170403342..59e361cc6c 100644 --- a/gensim/test/test_keyedvectors.py +++ b/gensim/test/test_keyedvectors.py @@ -15,7 +15,8 @@ import numpy as np from gensim.corpora import Dictionary -from gensim.models import KeyedVectors as EuclideanKeyedVectors, WordEmbeddingSimilarityIndex +from gensim.models.keyedvectors import KeyedVectors as EuclideanKeyedVectors, WordEmbeddingSimilarityIndex, \ + FastTextKeyedVectors from gensim.test.utils import datapath import gensim.models.keyedvectors @@ -279,6 +280,19 @@ def test_set_item(self): for ent, vector in zip(entities, vectors): self.assertTrue(np.allclose(self.vectors[ent], vector)) + def test_ft_kv_backward_compat_w_360(self): + kv = 
EuclideanKeyedVectors.load(datapath("ft_kv_3.6.0.model.gz")) + ft_kv = FastTextKeyedVectors.load(datapath("ft_kv_3.6.0.model.gz")) + + expected = ['trees', 'survey', 'system', 'graph', 'interface'] + actual = [word for (word, similarity) in kv.most_similar("human", topn=5)] + + self.assertEqual(actual, expected) + + actual = [word for (word, similarity) in ft_kv.most_similar("human", topn=5)] + + self.assertEqual(actual, expected) + class L2NormTest(unittest.TestCase): def test(self): diff --git a/gensim/test/test_ldaseqmodel.py b/gensim/test/test_ldaseqmodel.py index eb6ea120f6..227c78b4f6 100644 --- a/gensim/test/test_ldaseqmodel.py +++ b/gensim/test/test_ldaseqmodel.py @@ -13,7 +13,7 @@ class TestLdaSeq(unittest.TestCase): - # we are setting up a DTM model and fitting it, and checking topic-word and doc-topic results. + # we are setting up a DTM model and fitting it, and checking topic-word and doc-topic results. def setUp(self): texts = [ [u'senior', u'studios', u'studios', u'studios', u'creators', u'award', u'mobile', u'currently', diff --git a/gensim/test/test_utils.py b/gensim/test/test_utils.py index 74ca8b941f..c23087580f 100644 --- a/gensim/test/test_utils.py +++ b/gensim/test/test_utils.py @@ -6,8 +6,9 @@ """ Automated tests for checking various utils functions.
""" +from __future__ import unicode_literals + - +import sys import logging import unittest @@ -19,6 +20,8 @@ import gensim.models.utils_any2vec +import smart_open + DISABLE_CYTHON_TESTS = getattr(gensim.models.utils_any2vec, 'FAST_VERSION', None) == -1 @@ -269,12 +272,13 @@ def hash_main(alg): import six assert six.PY3, 'this only works under Py3' + assert not DISABLE_CYTHON_TESTS, 'this only works if Cython extensions available' hashmap = { - 'py': gensim.models.utils_any2vec._ft_hash_py, - 'py_broken': gensim.models.utils_any2vec._ft_hash_py_broken, - 'cy': gensim.models.utils_any2vec._ft_hash_py, - 'cy_broken': gensim.models.utils_any2vec._ft_hash_py_broken, + 'py_broken': gensim.models.utils_any2vec._ft_hash_broken_py, + 'py_bytes': gensim.models.utils_any2vec._ft_hash_bytes_py, + 'cy_broken': gensim.models.utils_any2vec._ft_hash_broken_cy, + 'cy_bytes': gensim.models.utils_any2vec._ft_hash_bytes_cy, } try: fun = hashmap[alg] @@ -282,7 +286,11 @@ def hash_main(alg): raise KeyError('invalid alg: %r expected one of %r' % (alg, sorted(hashmap))) for line in sys.stdin: - for word in line.rstrip().split(' '): + if 'bytes' in alg: + words = line.encode('utf-8').rstrip().split(b' ') + else: + words = line.rstrip().split(' ') + for word in words: print('u%r: %r,' % (word, fun(word))) @@ -293,7 +301,7 @@ def setUp(self): # # $ echo word1 ... wordN | python -c 'from gensim.test.test_utils import hash_main;hash_main("alg")' # noqa: E501 # - # where alg is one of py, py_broken, cy, cy_broken. + # where alg is one of py_bytes, py_broken, cy_bytes, cy_broken.
# self.expected = { @@ -330,24 +338,241 @@ def setUp(self): } def test_python(self): - actual = {k: gensim.models.utils_any2vec._ft_hash_py(k) for k in self.expected} + actual = {k: gensim.models.utils_any2vec._ft_hash_bytes_py(k.encode('utf-8')) for k in self.expected} self.assertEqual(self.expected, actual) @unittest.skipIf(DISABLE_CYTHON_TESTS, 'Cython functions are not properly compiled') def test_cython(self): - actual = {k: gensim.models.utils_any2vec._ft_hash_cy(k) for k in self.expected} + actual = {k: gensim.models.utils_any2vec._ft_hash_bytes_cy(k.encode('utf-8')) for k in self.expected} self.assertEqual(self.expected, actual) def test_python_broken(self): - actual = {k: gensim.models.utils_any2vec._ft_hash_py_broken(k) for k in self.expected} + actual = {k: gensim.models.utils_any2vec._ft_hash_broken_py(k) for k in self.expected} self.assertEqual(self.expected_broken, actual) @unittest.skipIf(DISABLE_CYTHON_TESTS, 'Cython functions are not properly compiled') def test_cython_broken(self): - actual = {k: gensim.models.utils_any2vec._ft_hash_cy_broken(k) for k in self.expected} + actual = {k: gensim.models.utils_any2vec._ft_hash_broken_cy(k) for k in self.expected} self.assertEqual(self.expected_broken, actual) +# +# Run with: +# +# python -c 'import gensim.test.test_utils as t;t.ngram_main()' py_text 3 5 +# +def ngram_main(): + """Generate ngrams for tests from standard input.""" + import sys + import six + + alg = sys.argv[1] + minn = int(sys.argv[2]) + maxn = int(sys.argv[3]) + + assert six.PY3, 'this only works under Py3' + assert not DISABLE_CYTHON_TESTS, 'this only works if Cython extensions available' + assert minn <= maxn, 'expected sane command-line parameters' + + hashmap = { + 'py_text': gensim.models.utils_any2vec._compute_ngrams_py, + 'py_bytes': gensim.models.utils_any2vec._compute_ngrams_bytes_py, + 'cy_text': gensim.models.utils_any2vec._compute_ngrams_cy, + 'cy_bytes': gensim.models.utils_any2vec._compute_ngrams_bytes_cy, + } + try: + fun 
= hashmap[alg] + except KeyError: + raise KeyError('invalid alg: %r expected one of %r' % (alg, sorted(hashmap))) + + for line in sys.stdin: + word = line.rstrip('\n') + ngrams = fun(word, minn, maxn) + print("%r: %r," % (word, ngrams)) + + +class NgramsTest(unittest.TestCase): + def setUp(self): + self.expected_text = { + 'test': ['', '', ''], + 'at the': [ + '', + '', '' + ], + 'at\nthe': [ + '', + '', '' + ], + 'тест': ['<те', 'тес', 'ест', 'ст>', '<тес', 'тест', 'ест>', '<тест', 'тест>'], + 'テスト': ['<テス', 'テスト', 'スト>', '<テスト', 'テスト>', '<テスト>'], + '試し': ['<試し', '試し>', '<試し>'], + } + self.expected_bytes = { + 'test': [b'', b'est', b'est>', b'st>'], + 'at the': [ + b'', b'the', b'the>', b'he>' + ], + 'тест': [ + b'<\xd1\x82\xd0\xb5', b'<\xd1\x82\xd0\xb5\xd1\x81', b'<\xd1\x82\xd0\xb5\xd1\x81\xd1\x82', + b'\xd1\x82\xd0\xb5\xd1\x81', b'\xd1\x82\xd0\xb5\xd1\x81\xd1\x82', b'\xd1\x82\xd0\xb5\xd1\x81\xd1\x82>', + b'\xd0\xb5\xd1\x81\xd1\x82', b'\xd0\xb5\xd1\x81\xd1\x82>', b'\xd1\x81\xd1\x82>' + ], + 'テスト': [ + b'<\xe3\x83\x86\xe3\x82\xb9', b'<\xe3\x83\x86\xe3\x82\xb9\xe3\x83\x88', + b'<\xe3\x83\x86\xe3\x82\xb9\xe3\x83\x88>', b'\xe3\x83\x86\xe3\x82\xb9\xe3\x83\x88', + b'\xe3\x83\x86\xe3\x82\xb9\xe3\x83\x88>', b'\xe3\x82\xb9\xe3\x83\x88>' + ], + '試し': [b'<\xe8\xa9\xa6\xe3\x81\x97', b'<\xe8\xa9\xa6\xe3\x81\x97>', b'\xe8\xa9\xa6\xe3\x81\x97>'], + } + + self.expected_text_wide_unicode = { + '🚑🚒🚓🚕': [ + '<🚑🚒', '🚑🚒🚓', '🚒🚓🚕', '🚓🚕>', + '<🚑🚒🚓', '🚑🚒🚓🚕', '🚒🚓🚕>', '<🚑🚒🚓🚕', '🚑🚒🚓🚕>' + ], + } + self.expected_bytes_wide_unicode = { + '🚑🚒🚓🚕': [ + b'<\xf0\x9f\x9a\x91\xf0\x9f\x9a\x92', + b'<\xf0\x9f\x9a\x91\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93', + b'<\xf0\x9f\x9a\x91\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93\xf0\x9f\x9a\x95', + b'\xf0\x9f\x9a\x91\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93', + b'\xf0\x9f\x9a\x91\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93\xf0\x9f\x9a\x95', + b'\xf0\x9f\x9a\x91\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93\xf0\x9f\x9a\x95>', + b'\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93\xf0\x9f\x9a\x95', + 
b'\xf0\x9f\x9a\x92\xf0\x9f\x9a\x93\xf0\x9f\x9a\x95>', + b'\xf0\x9f\x9a\x93\xf0\x9f\x9a\x95>' + ], + } + + def test_text_py(self): + for word in self.expected_text: + expected = self.expected_text[word] + actual = gensim.models.utils_any2vec._compute_ngrams_py(word, 3, 5) + self.assertEqual(expected, actual) + + @unittest.skipIf(sys.maxunicode == 0xffff, "Python interpreter doesn't support UCS-4 (wide unicode)") + def test_text_py_wide_unicode(self): + for word in self.expected_text_wide_unicode: + expected = self.expected_text_wide_unicode[word] + actual = gensim.models.utils_any2vec._compute_ngrams_py(word, 3, 5) + self.assertEqual(expected, actual) + + @unittest.skipIf(DISABLE_CYTHON_TESTS, 'Cython functions are not properly compiled') + def test_text_cy(self): + for word in self.expected_text: + expected = self.expected_text[word] + actual = gensim.models.utils_any2vec._compute_ngrams_cy(word, 3, 5) + self.assertEqual(expected, actual) + + @unittest.skipIf(DISABLE_CYTHON_TESTS, 'Cython functions are not properly compiled') + @unittest.skipIf(sys.maxunicode == 0xffff, "Python interpreter doesn't support UCS-4 (wide unicode)") + def test_text_cy_wide_unicode(self): + for word in self.expected_text_wide_unicode: + expected = self.expected_text_wide_unicode[word] + actual = gensim.models.utils_any2vec._compute_ngrams_cy(word, 3, 5) + self.assertEqual(expected, actual) + + def test_bytes_py(self): + for word in self.expected_bytes: + expected = self.expected_bytes[word] + actual = gensim.models.utils_any2vec._compute_ngrams_bytes_py(word, 3, 5) + self.assertEqual(expected, actual) + + expected_text = self.expected_text[word] + actual_text = [n.decode('utf-8') for n in actual] + # + # The text and byte implementations yield ngrams in different + # order, so the test ignores ngram order. 
+ # + self.assertEqual(sorted(expected_text), sorted(actual_text)) + + for word in self.expected_bytes_wide_unicode: + expected = self.expected_bytes_wide_unicode[word] + actual = gensim.models.utils_any2vec._compute_ngrams_bytes_py(word, 3, 5) + self.assertEqual(expected, actual) + + expected_text = self.expected_text_wide_unicode[word] + actual_text = [n.decode('utf-8') for n in actual] + + self.assertEqual(sorted(expected_text), sorted(actual_text)) + + @unittest.skipIf(DISABLE_CYTHON_TESTS, 'Cython functions are not properly compiled') + def test_bytes_cy(self): + for word in self.expected_bytes: + expected = self.expected_bytes[word] + actual = gensim.models.utils_any2vec._compute_ngrams_bytes_cy(word, 3, 5) + self.assertEqual(expected, actual) + + expected_text = self.expected_text[word] + actual_text = [n.decode('utf-8') for n in actual] + self.assertEqual(sorted(expected_text), sorted(actual_text)) + + for word in self.expected_bytes_wide_unicode: + expected = self.expected_bytes_wide_unicode[word] + actual = gensim.models.utils_any2vec._compute_ngrams_bytes_cy(word, 3, 5) + self.assertEqual(expected, actual) + + expected_text = self.expected_text_wide_unicode[word] + actual_text = [n.decode('utf-8') for n in actual] + self.assertEqual(sorted(expected_text), sorted(actual_text)) + + def test_fb(self): + """Test against results from Facebook's implementation.""" + with smart_open.smart_open(datapath('fb-ngrams.txt'), 'r', encoding='utf-8') as fin: + fb = dict(_read_fb(fin)) + + for word, expected in fb.items(): + # + # The model was trained with minn=3, maxn=6 + # + actual = gensim.models.utils_any2vec._compute_ngrams_py(word, 3, 6) + self.assertEqual(sorted(expected), sorted(actual)) + + +def _read_fb(fin): + """Read ngrams from output of the FB utility.""" + # + # $ cat words.txt + # test + # at the + # at\nthe + # тест + # テスト + # 試し + # 🚑🚒🚓🚕 + # $ while read w; + # do + # echo ""; + # echo $w; + # ./fasttext print-ngrams 
gensim/test/test_data/crime-and-punishment.bin "$w"; + # echo "<end>"; + # done < words.txt > gensim/test/test_data/fb-ngrams.txt + # + while fin: + line = fin.readline().rstrip() + if not line: + break + + assert line == '<start>' + word = fin.readline().rstrip() + + fin.readline() # ignore this line, it contains an origin vector for the full term + + ngrams = [] + while True: + line = fin.readline().rstrip() + if line == '<end>': + break + + columns = line.split(' ') + term = ' '.join(columns[:-5]) + ngrams.append(term) + + yield word, ngrams + + if __name__ == '__main__': logging.root.setLevel(logging.WARNING) unittest.main() diff --git a/setup.py b/setup.py index 0de5e535c5..0e60453d01 100644 --- a/setup.py +++ b/setup.py @@ -301,7 +301,7 @@ def finalize_options(self): setup( name='gensim', - version='3.7.0', + version='3.7.1', description='Python framework for fast Vector Space Modelling', long_description=LONG_DESCRIPTION,