diff --git a/notebooks/model_wz.ipynb b/notebooks/model_wz.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..76fc9a889bb13f55640a53397d673f043c7db0e1 --- /dev/null +++ b/notebooks/model_wz.ipynb @@ -0,0 +1,5712 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "aae7ed22-70fd-40c9-96b3-ab95128778ed", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import csv\n", + "import pathlib\n", + "import pandas as pd\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "import nltk\n", + "import re\n", + "import statistics\n", + "import string\n", + "from collections import Counter\n", + "from collections import defaultdict\n", + "from sklearn.model_selection import train_test_split\n", + "import octis\n", + "import gensim\n", + "import spacy\n", + "import sklearn\n", + "import torch\n", + "import libsvm\n", + "import flask\n", + "import sentence_transformers\n", + "import requests\n", + "import tomotopy" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "44cdbc43-3210-44e1-aae2-3df85cd58804", + "metadata": {}, + "outputs": [], + "source": [ + "import warnings\n", + "warnings.filterwarnings(\"ignore\")" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "e5279737-393b-4780-b4e3-4cb6fe300f98", + "metadata": {}, + "outputs": [], + "source": [ + "os.chdir(r\"C:\\Users\\onb1202\\OneDrive - Österreichische Nationalbibliothek\\Praktikum TK\\daten\")" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "ba20b025-7c11-4b1e-bfd5-f3b180740a6e", + "metadata": {}, + "outputs": [], + "source": [ + "wz_clean = pd.read_csv('wz_clean5.tsv', sep = '\\t', encoding='utf-8')" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "48b406dc-8d9b-454c-98ed-ceed68d3be5f", + "metadata": {}, + "outputs": [], + "source": [ + "wz_clean = wz_clean.iloc[: , 1:]" + ] + }, + { + "cell_type": "code", + "execution_count": 13, 
+ "id": "c4d03ec1-c2a6-4e7c-9c47-d1b6276fe214", + "metadata": {}, + "outputs": [], + "source": [ + "wz_clean = wz_clean.drop(columns=['year'])" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "2405f8c4-7457-4872-8bd1-bc0fe53f304c", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ocrsplitmanifest_id
0sonnabend iäner inländische begebenheiten bens...testwrz17890103
1mittewoche ianer inländische begebenheit wien ...trainwrz17890107
2dtii inländische begebenheiten vorthei zugleic...testwrz17890110
3mittewoche begebenheiten sonntag hofe gottesdi...trainwrz17890114
4sonnabend inländische begebenheit horch kret r...trainwrz17890117
............
1090sonnabend december inländische majestät habew ...trainwrz17991214
1091sranj unft ober unftre gehn tlgen stieg turd m...validwrz17991218
1092sonnabend december inländische begebenheiten w...validwrz17991221
1093zmar mittewoche december inländische vegebenhe...testwrz17991225
1094sonnabend december inländische bege hell chris...testwrz17991228
\n", + "

1095 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " ocr split manifest_id\n", + "0 sonnabend iäner inländische begebenheiten bens... test wrz17890103\n", + "1 mittewoche ianer inländische begebenheit wien ... train wrz17890107\n", + "2 dtii inländische begebenheiten vorthei zugleic... test wrz17890110\n", + "3 mittewoche begebenheiten sonntag hofe gottesdi... train wrz17890114\n", + "4 sonnabend inländische begebenheit horch kret r... train wrz17890117\n", + "... ... ... ...\n", + "1090 sonnabend december inländische majestät habew ... train wrz17991214\n", + "1091 sranj unft ober unftre gehn tlgen stieg turd m... valid wrz17991218\n", + "1092 sonnabend december inländische begebenheiten w... valid wrz17991221\n", + "1093 zmar mittewoche december inländische vegebenhe... test wrz17991225\n", + "1094 sonnabend december inländische bege hell chris... test wrz17991228\n", + "\n", + "[1095 rows x 3 columns]" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "wz_clean" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "3b31742f-7ee4-4bee-97e8-0325980c605c", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "train 652\n", + "test 222\n", + "valid 221\n", + "Name: split, dtype: int64" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "wz_clean['split'].value_counts()" + ] + }, + { + "cell_type": "code", + "execution_count": 53, + "id": "0271ae15-71f5-4465-ac28-5d69320944b4", + "metadata": {}, + "outputs": [], + "source": [ + "wz_clean.to_csv('corpus_wz_clean5.tsv', sep='\\t', index=False, header=False)" + ] + }, + { + "cell_type": "markdown", + "id": "4e2208c9-f8d6-4ea2-a746-b52df8a030f5", + "metadata": {}, + "source": [ + "

vocabulary creation

" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "552e66ef-def5-407b-9de8-d4ee89fb1039", + "metadata": {}, + "outputs": [], + "source": [ + "wz_clean = pd.read_csv('wz_clean5.tsv', sep = '\\t', encoding='utf-8')" + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "id": "bc4bba2a-8c43-4f1a-946c-34c3fda4c0f3", + "metadata": {}, + "outputs": [], + "source": [ + "texts_wz = ' '.join(wz_clean['ocr'])  # explicit space: Series.sum() would glue neighbouring documents together without a separator" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "fdf64a4c-a1eb-4c7e-92b5-53743d766d47", + "metadata": {}, + "outputs": [], + "source": [ + "texts_wz = texts_wz.split()  # no argument: runs of whitespace produce no empty tokens" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "id": "7c98bb56-c77a-4fd1-b593-0a1f4d3b468b", + "metadata": {}, + "outputs": [], + "source": [ + "vocabulary_wz = set(texts_wz)" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "id": "45bb9dc8-8595-470a-bbcd-4139cf583ece", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "118936" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(vocabulary_wz)" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "id": "fc674043-e3a6-4df2-bd32-5f7d82d8ee44", + "metadata": {}, + "outputs": [], + "source": [ + "# Write one vocabulary word per line. The context manager closes the file even if a\n", + "# word cannot be encoded as cp1252; sorting makes the file identical across runs.\n", + "with open(\"vocabulary_wz_enc5.txt\", \"w\", encoding='cp1252') as textfile:\n", + "    textfile.writelines(element + \"\\n\" for element in sorted(vocabulary_wz))" + ] + }, + { + "cell_type": "markdown", + "id": "591b33ac-3660-49a3-9a80-5a6a1ec16e57", + "metadata": {}, + "source": [ + "

default model

" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "25625a43-6351-4aec-b651-6a738229e899", + "metadata": {}, + "outputs": [], + "source": [ + "from octis.models.ETM import ETM\n", + "from octis.dataset.dataset import Dataset" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "d209323b-9993-485d-9f45-f624dcda96ce", + "metadata": {}, + "outputs": [], + "source": [ + "dataset = Dataset()\n", + "dataset.load_custom_dataset_from_folder(r\"C:\\Users\\onb1202\\OneDrive - Österreichische Nationalbibliothek\\Praktikum TK\\daten\\corpus_wz_5\")" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "df1890b9-2f23-4c36-ad66-06065546b360", + "metadata": {}, + "outputs": [], + "source": [ + "model = ETM(num_topics=100, num_epochs=150, t_hidden_size=1000, rho_size=600,\n", + "embedding_size=800, activation='relu', dropout=0.1, lr=0.005,\n", + "optimizer='adam', batch_size=128, clip=0.0, wdecay=1.2e-06, bow_norm=1,\n", + "device='cpu', top_word=25, train_embeddings=True, embeddings_path=None,\n", + "embeddings_type='pickle', binary_embeddings=True,\n", + "headerless_embeddings=False, use_partitions=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "80234356-807b-4de0-a76b-80f9ad404928", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=600, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=600, out_features=100, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=1000, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=1000, out_features=1000, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=1000, out_features=100, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=1000, out_features=100, bias=True)\n", + ")\n", + 
"****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.28 .. Rec_loss: 88905.47 .. NELBO: 88906.75\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. NELBO: nan\n", + "****************************************************************************************************\n" + ] + } + ], + "source": [ + "model_output = model.train_model(dataset)" + ] + }, + { + "cell_type": "code", + "execution_count": 263, + "id": "b54d6245-9776-4fef-9088-96fba86028fa", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "hinaus nachher befanden unfehlbar entschieden mauern gleich widrigenfalls königl rden\n", + "bevollmächtig oktober gebe groß scho fortgesetzt nahm zinn bücher herr\n", + "gränze sagten befanden adler stellte hinaus wenigstens flotte herrschaft eiche\n", + "tten oktober nung wenigstens mauern herr adler vorsicht könn nehme\n", + "oktober herr freyherrn mauern eiche wieden zimmer schein keller tages\n", + "alda ters dortigen ischen hinaus wage scho eigenschaft verdienste grossen\n", + "adler barometerstand gleich widrigenfalls such anzumelden falls bestehend theil ersteren\n", + "bevollmächtig traf hinaus tages general oktober that priester ansprü schein\n", + "herr wenzel eigene erhielt bevollmächtig mber dürfen sieben golde gegeben\n", + "schön rben bestehend anzumelden jahr gebe gebliebenen lehen keller versichern\n", + "eiche gleich hinaus tages termins scho königl walter nahe oktober\n", + "such richtig dienstbare hinaus melde gattung ledige gelegen ferd eiche\n", + "mauern bevollmächtig jahren eiche dürfen wenigstens such anführer ausfindig unsern\n", + "mauern königl dukaten geschickte gebrauch 
reiche gesandt wenigstens tüch stellte\n", + "gesetzt mauern gemäß scho melde sprach gibt hiesige sieben befanden\n", + "verlasse unfehlbar pfen voraus gleich wesen such ledige berliner bothen\n", + "bevollmächtig termins fragen oktober wieden gebe such bedacht gerichtet gethan\n", + "dortigen stellte gränze gesandt bedacht dritte abtheilung bewegung traf rden\n", + "volle herr dienstbare sagten ranz erworben anzumelden königl niger bücher\n", + "büchern cher indessen mauern herr scho hinaus gemäß bedacht beding\n", + "starten blieb befanden diejenigen gebührte französisch alda mauern wenigstens rden\n", + "dienstbare anzumelden mauern dritte eigene schweden rußische vorzuladen theil scho\n", + "such hinaus wäscher könn vergleich befindlich bücher volle erweisen gedenke\n", + "eder mühle adler rechr hinaus erweisen anmelden tzen sebast mauern\n", + "gleich oktober sieben schweden wind beding theil hundert dukaten ulrich\n", + "drey herr dortigen hinaus nachher scho bücher kaiser niemand ranz\n", + "scho eigene stellte erscheinen ferd wahrscheinlich darunter königl schönes tages\n", + "hinaus ranz theil ledige befanden kleinen cher traf keller kleider\n", + "dahin gläubiger widrigenfalls anzumelden schweden dienstbare schein zahlung eiche dieft\n", + "bevollmächtig grossen volle befanden mittels oktober erweisen gränze erhielt gesetzt\n", + "herr eigene bevollmächtig oktober gränze rden verlangte schweden setzen rechr\n", + "staaten gegenwärtig herr mittels nachricht befanden adler wenigstens scho gesandt\n", + "schweden gesamm rung fragen mauern zeitung eigene beding lande kaiser\n", + "hinaus weniger schweden scho gattung gleich größten herr stellte schein\n", + "königl jahren mauern bevollmächtig unfehlbar rung gegenwärtig gnade stellte vorzu\n", + "mauern hinaus eder befanden unserer zimmer widrigenfalls einzelne oktober wenigstens\n", + "abends grossen weichen fragen vergleich aeckern einzelne mittels adler untersuchung\n", + "sieben scho dienstbare arbeit 
dritte dortigen schweden bevollmächtig waaren herrschaft\n", + "hinaus mauern verdienste oktober adler kleinen rußische enthalten theils zimmer\n", + "scho nachher stellte anzumelden reiche gebührte cher weniger gebe okto\n", + "unfehlbar herr ischen anzumelden eigene wenigstens wind unternehmung dürften fragen\n", + "kleider mauern deutsch grösse such eder sachen herr anzumelden diensten\n", + "wenigstens schweden theil oktober rische gleich dortigen vermögen bier zeit\n", + "niemand hinaus walter dienstbare zimmer verdienste general nahm bücher dritte\n", + "königl scho gesetzt mauern ersteren theil hinaus fragen drey nahm\n", + "nöthig ferd bevollmächtig keller hende schein generale rung strenge hergestellt\n", + "offizieren rechr schweden mente that wohlfahrt weniger mauern königl gleich\n", + "königl widrigenfalls schweden bevollmächtig hell oktober walter anführer eigene grossen\n", + "wenigstens todt groß erklärung dukaten niger niemand termins fortgesetzt nämlich\n", + "mauern eiche kurzem begebenheiten höher nutzen zimmer anzumelden erweisen gruber\n", + "ters ferd eifer weiss hinaus gegenwärtig scho rück gebührte ausfindig\n", + "oktober gränze schein bevollmächtig rechr adler erweisen verkaufe bisher bücher\n", + "herr höchste hinaus gattung befanden vorschrift bevollmächtig voraus erklärung walter\n", + "angriffe stellte leere oktober schuldig anführer erweisen ffen niemand darunter\n", + "wenigstens gleich anzumelden mittels kaiser schweren bevollmächtig ferd gattung hinaus\n", + "darf rechr mauern befanden raab verlauf stellte wenigstens gegeben zeit\n", + "such scho tages erklärung deutsch hinaus jahren königl anzumelden wenigstens\n", + "verdienste oktober bevollmächtig letzten silber ehre verlangte betrag hinaus mittels\n", + "angriffe adler dürfen mittels könn erweisen wiesen traf hauptstadt zimmer\n", + "hinaus könn vier theil rechr grossen erstgedacht kaiser heuboden mauern\n", + "hinaus verlangte liget niger kaiser widrigenfalls unfehlbar 
eigene weiss kund\n", + "mauern hinaus jahr verkaufe befindliche gruber lande general bevollmächtig adler\n", + "wenigstens oktober nutzen wich dürfen bücher geschieht mauern dung beweisen\n", + "wenigstens anzumelden hinaus grossen adler rden fragen letzten abtheilung starken\n", + "masse dortigen gegenden unternehmung cheln scho anfragen grossen gebe herr\n", + "meister gedenke oktober letzt schweden befanden widrigenfalls schuldig wenigstens aeckern\n", + "mauern kleinen scho wenigstens rische deutsch schuldig bäume standes termins\n", + "hinaus ferd mauern doktor zimmer anzumelden blatt oktober habm eiche\n", + "eigene höchste herr beweg kleinere hundert weniger darf bücher sagten\n", + "aeckern hinaus mauern traf julius vermögen adler gemäß such königl\n", + "befindlich stellte mauern theil adler gränze unfehlbar dienstbare bestehend näher\n", + "gemeldet rden hinaus dritte ferd nahm woche sagten ider gränze\n", + "königl oktober hinaus sagten rechr enthalten vorder stände nahm eiche\n", + "hinaus magistrat termins lande keller ferd widrigenfalls gebirg übrig eigene\n", + "meistens hinaus nutzen wech mauern zimmer erde setzen ende ofen\n", + "gebe jahren letzten dritte dortigen unfehlbar heit keller vollkommen zimmer\n", + "such bevollmächtig hinaus schein staaten scho meistens jahren theil braunen\n", + "adler hinaus wenigstens letzten schweren neuesten rück schuldig wahrend mangel\n", + "nutzen gebührte groß hinaus mittels königl gattung kleider tische widrigenfalls\n", + "niemand mauern walter adler sagten wäscher hauptstadt unterhaltung vergleich nahe\n", + "starken unterm stellte aeckern sagten mauern barometerstand anzumelden verkaufe gränze\n", + "gebührte erweisen ofen bevollmächtig mauern anzumelden grossen gebrauch magistrat stände\n", + "hinaus unterm förmliche bevor hofe nutzen hicmit befindliche hiesige traf\n", + "such schweden kaiser zimmer sagten eiche hinaus beding nutzen letzt\n", + "ferd freyherrn wahrend kurzem weiss anzumelden illum beweg 
sagten letzt\n", + "rechr königl mauern versichern bevollmächtig richten hinaus unternehmung kaiser wert\n", + "nachher termins gebrauch bevollmächtig unterhaltung hinaus ulrich wenigstens unfehlbar bewegung\n", + "strenge adler interessen mauern begebenheiten gebührte fund erweisen vorgeladen oktober\n", + "sachen schweden ischen stellte bevollmächtig nachrichten nachricht beding rosina gebliebenen\n", + "gebirg könn wenigstens hauptstadt gebührte adler erweisen unbekannt bevollmächtig berliner\n", + "herr gemeldet eigene hinaus unternehmung groß königl barb mannschaft oktober\n", + "scho keller unfehlbar königl ferd kleider gebe dritte kart dürften\n", + "richten walter bücher bevollmächtig stande ters erweisen gerichtet fchen beding\n", + "grossen bücher bevollmächtig gebührte meistens lande schuldig geschrieben dritte nachrichten\n", + "gleich mittels höher befanden mauern angriffe unternehmung ischen tages unterhalt\n", + "vermögen ferd eröffnen kleinen hinaus dritte traf niemand ranz raab\n", + "befanden mauern oktober richtig kammer hinaus zugeben rechr diensten rden\n", + "widrigenfalls darunter anzumelden bevollmächtig gemeldet gebe eigene traf mauern betreffend\n", + "deutsch unfehlbar hinaus erschienen schweden angehörigen wenigstens weicher verdienste abends\n", + "zimmer gleich münchen ranz starken oktober rosina kirchen vermeinen mauern\n" + ] + } + ], + "source": [ + "for t in model_output['topics']:\n", + " print(\" \".join(t))" + ] + }, + { + "cell_type": "markdown", + "id": "be195592-c0a9-400d-b816-cd11d47100c4", + "metadata": {}, + "source": [ + "

check topic distribution

" + ] + }, + { + "cell_type": "code", + "execution_count": 264, + "id": "7cd3af7a-d01f-4fee-b509-da028801bb0e", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0.0059787964725444105\n", + "0.00769818471487543\n", + "0.007845006928139258\n", + "0.01287745649103601\n", + "0.007882614055808429\n", + "0.021140513627395673\n", + "0.0063803652158589816\n", + "0.003840347867676177\n", + "0.004482069944797164\n", + "0.009222705558548035\n", + "0.020719753923980188\n", + "0.012815042394584765\n", + "0.0036802868079536945\n", + "0.0038627161897227535\n", + "0.003942424188613709\n", + "0.010904119111471837\n", + "0.02083862852305174\n", + "0.0039198275136281425\n", + "0.003930344608429523\n", + "0.019912233673310353\n", + "0.009020648005367057\n", + "0.018197241619206463\n", + "0.007845113325315567\n", + "0.020443208261387298\n", + "0.007630307515911712\n", + "0.0038729453722923493\n", + "0.003944417128576526\n", + "0.019241918109791593\n", + "0.006635155320236105\n", + "0.005551625108146366\n", + "0.021718534940933707\n", + "0.007321812053199606\n", + "0.005683674732011749\n", + "0.013743482955782874\n", + "0.015188533702773824\n", + "0.0058729551401149275\n", + "0.003977611751661299\n", + "0.0051438200910307146\n", + "0.0046773377700246\n", + "0.005799026364900537\n", + "0.017189493779938645\n", + "0.021009703523885072\n", + "0.020543984457439074\n", + "0.02112997764652949\n", + "0.015288039062035047\n", + "0.006784754181052187\n", + "0.007869153709202274\n", + "0.00585381303731055\n", + "0.02105999588566415\n", + "0.005403961653484066\n", + "0.012953664470418283\n", + "0.012613967865236973\n", + "0.005746458852063705\n", + "0.005720107985426175\n", + "0.011443835176081836\n", + "0.004239832541042585\n", + "0.0045247736774053585\n", + "0.0140295498418776\n", + "0.005426113865841066\n", + "0.015673086711382664\n", + "0.01046041199120413\n", + "0.0041382441881392725\n", + "0.005948414665395451\n", + "0.012997421380303846\n", 
+ "0.005786573506486059\n", + "0.006074188288552629\n", + "0.006132205834675101\n", + "0.007801057174487576\n", + "0.009358633673846995\n", + "0.017313944270114408\n", + "0.004158880121640267\n", + "0.0039015584286056643\n", + "0.017692697925801658\n", + "0.005685131463359333\n", + "0.006272824476130215\n", + "0.015042053701276063\n", + "0.020335983999210633\n", + "0.01280361829336984\n", + "0.01406441831195647\n", + "0.005614401967596103\n", + "0.005594803066067169\n", + "0.004014016096223077\n", + "0.006813921707116662\n", + "0.02118835557949232\n", + "0.005006143916112605\n", + "0.020362335885732087\n", + "0.01003323871630924\n", + "0.010151861646881134\n", + "0.010257397226966414\n", + "0.003919887495372856\n", + "0.005887601066786407\n", + "0.007057942212216464\n", + "0.006157704665428428\n", + "0.011487390160377772\n", + "0.009505817069574917\n", + "0.016725525834191977\n", + "0.014215720797448985\n", + "0.011327869850182278\n", + "0.0038987879024995663\n", + "0.006923938894278707\n" + ] + } + ], + "source": [ + "for topic_weights in model_output['topic-document-matrix']:  # one row per topic, one weight per document\n", + "    print(sum(topic_weights) / len(topic_weights))  # mean weight of this topic over all documents" + ] + }, + { + "cell_type": "code", + "execution_count": 265, + "id": "f10410dd-c938-4bc9-948a-88dadc0e2b6f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "100" + ] + }, + "execution_count": 265, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(model_output['topic-document-matrix'])" + ] + }, + { + "cell_type": "code", + "execution_count": 266, + "id": "b0b46352-d952-44b9-86b9-cc6cfb548885", + "metadata": {}, + "outputs": [], + "source": [ + "top_doc_matrix = model_output['topic-document-matrix']" + ] + }, + { + "cell_type": "code", + "execution_count": 267, + "id": "63b6dc49-5441-4ffc-b82a-352014c4dced", + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.DataFrame(top_doc_matrix).T" + ] + }, + { + "cell_type": "code", + "execution_count": 269, + "id": "29085dee-47b8-4360-82f4-93ed12e4da08", +
"metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
0123456789...90919293949596979899
00.0059980.0077140.0078600.0128720.0078970.0210790.0063980.0038610.0045030.009234...0.0059060.0070750.0061760.0114900.0095150.0166960.0142050.0113310.0039190.006941
10.0060120.0077260.0078730.0128670.0079090.0210330.0064130.0038760.0045190.009242...0.0059210.0070880.0061900.0114920.0095220.0166720.0141960.0113340.0039350.006956
20.0060100.0077240.0078710.0128680.0079070.0210390.0064110.0038740.0045170.009240...0.0059190.0070860.0061880.0114920.0095210.0166750.0141980.0113340.0039330.006953
30.0060150.0077280.0078740.0128670.0079100.0210250.0064140.0038790.0045210.009244...0.0059230.0070910.0061920.0114920.0095230.0166690.0141940.0113330.0039380.006957
40.0060180.0077310.0078800.0128650.0079140.0210100.0064200.0038840.0045270.009245...0.0059280.0070930.0061970.0114940.0095270.0166620.0141930.0113360.0039430.006963
..................................................................
6470.0059570.0076800.0078290.0128830.0078670.0212070.0063620.0038180.0044600.009209...0.0058670.0070380.0061370.0114870.0094970.0167590.0142290.0113260.0038760.006906
6480.0059600.0076820.0078310.0128820.0078680.0211990.0063640.0038210.0044620.009211...0.0058690.0070400.0061400.0114870.0094980.0167550.0142270.0113260.0038790.006908
6490.0059480.0076720.0078210.0128860.0078590.0212390.0063520.0038070.0044490.009204...0.0058570.0070290.0061280.0114850.0094930.0167750.0142350.0113240.0038650.006896
6500.0059670.0076880.0078360.0128810.0078740.0211780.0063700.0038280.0044690.009215...0.0058760.0070470.0061460.0114870.0095010.0167440.0142230.0113270.0038860.006914
6510.0059550.0076790.0078270.0128840.0078650.0212150.0063590.0038150.0044570.009209...0.0058650.0070360.0061350.0114850.0094950.0167630.0142300.0113250.0038730.006903
\n", + "

652 rows × 100 columns

\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 \\\n", + "0 0.005998 0.007714 0.007860 0.012872 0.007897 0.021079 0.006398 \n", + "1 0.006012 0.007726 0.007873 0.012867 0.007909 0.021033 0.006413 \n", + "2 0.006010 0.007724 0.007871 0.012868 0.007907 0.021039 0.006411 \n", + "3 0.006015 0.007728 0.007874 0.012867 0.007910 0.021025 0.006414 \n", + "4 0.006018 0.007731 0.007880 0.012865 0.007914 0.021010 0.006420 \n", + ".. ... ... ... ... ... ... ... \n", + "647 0.005957 0.007680 0.007829 0.012883 0.007867 0.021207 0.006362 \n", + "648 0.005960 0.007682 0.007831 0.012882 0.007868 0.021199 0.006364 \n", + "649 0.005948 0.007672 0.007821 0.012886 0.007859 0.021239 0.006352 \n", + "650 0.005967 0.007688 0.007836 0.012881 0.007874 0.021178 0.006370 \n", + "651 0.005955 0.007679 0.007827 0.012884 0.007865 0.021215 0.006359 \n", + "\n", + " 7 8 9 ... 90 91 92 \\\n", + "0 0.003861 0.004503 0.009234 ... 0.005906 0.007075 0.006176 \n", + "1 0.003876 0.004519 0.009242 ... 0.005921 0.007088 0.006190 \n", + "2 0.003874 0.004517 0.009240 ... 0.005919 0.007086 0.006188 \n", + "3 0.003879 0.004521 0.009244 ... 0.005923 0.007091 0.006192 \n", + "4 0.003884 0.004527 0.009245 ... 0.005928 0.007093 0.006197 \n", + ".. ... ... ... ... ... ... ... \n", + "647 0.003818 0.004460 0.009209 ... 0.005867 0.007038 0.006137 \n", + "648 0.003821 0.004462 0.009211 ... 0.005869 0.007040 0.006140 \n", + "649 0.003807 0.004449 0.009204 ... 0.005857 0.007029 0.006128 \n", + "650 0.003828 0.004469 0.009215 ... 0.005876 0.007047 0.006146 \n", + "651 0.003815 0.004457 0.009209 ... 
0.005865 0.007036 0.006135 \n", + "\n", + " 93 94 95 96 97 98 99 \n", + "0 0.011490 0.009515 0.016696 0.014205 0.011331 0.003919 0.006941 \n", + "1 0.011492 0.009522 0.016672 0.014196 0.011334 0.003935 0.006956 \n", + "2 0.011492 0.009521 0.016675 0.014198 0.011334 0.003933 0.006953 \n", + "3 0.011492 0.009523 0.016669 0.014194 0.011333 0.003938 0.006957 \n", + "4 0.011494 0.009527 0.016662 0.014193 0.011336 0.003943 0.006963 \n", + ".. ... ... ... ... ... ... ... \n", + "647 0.011487 0.009497 0.016759 0.014229 0.011326 0.003876 0.006906 \n", + "648 0.011487 0.009498 0.016755 0.014227 0.011326 0.003879 0.006908 \n", + "649 0.011485 0.009493 0.016775 0.014235 0.011324 0.003865 0.006896 \n", + "650 0.011487 0.009501 0.016744 0.014223 0.011327 0.003886 0.006914 \n", + "651 0.011485 0.009495 0.016763 0.014230 0.011325 0.003873 0.006903 \n", + "\n", + "[652 rows x 100 columns]" + ] + }, + "execution_count": 269, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 270, + "id": "47fb5f79-1bd9-4d7e-92a5-7a7ca0869a79", + "metadata": {}, + "outputs": [], + "source": [ + "wz = pd.read_csv('wz_clean.tsv', sep = '\\t', encoding='utf-8')" + ] + }, + { + "cell_type": "code", + "execution_count": 271, + "id": "deb3780d-eb8b-4961-b094-a8b7138ee687", + "metadata": {}, + "outputs": [], + "source": [ + "wz = wz.iloc[: , 1:]" + ] + }, + { + "cell_type": "code", + "execution_count": 272, + "id": "585642c2-892a-4435-8d73-74234cc3a09c", + "metadata": {}, + "outputs": [], + "source": [ + "wz = wz.iloc[: , 1:]" + ] + }, + { + "cell_type": "code", + "execution_count": 274, + "id": "3989efb9-e7ec-40f8-8170-15497cfbe2b8", + "metadata": {}, + "outputs": [], + "source": [ + "df_split = wz[wz['split'] == 'train']" + ] + }, + { + "cell_type": "code", + "execution_count": 275, + "id": "a62f613d-1a2c-4cff-9395-8123a716ead6", + "metadata": {}, + "outputs": [], + "source": [ + "df_split = 
df_split.reset_index(drop=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 276, + "id": "5574d790-7cb4-4559-87aa-673fecdb4b5e", + "metadata": {}, + "outputs": [], + "source": [ + "df_top_doc_mat = pd.concat([df_split, df], axis=\"columns\")" + ] + }, + { + "cell_type": "code", + "execution_count": 277, + "id": "a3713d66-4846-4970-aa3e-d53871b2e1db", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
splitmanifest_idyear0123456...90919293949596979899
0trainwrz1789010717890.0059980.0077140.0078600.0128720.0078970.0210790.006398...0.0059060.0070750.0061760.0114900.0095150.0166960.0142050.0113310.0039190.006941
1trainwrz1789011417890.0060120.0077260.0078730.0128670.0079090.0210330.006413...0.0059210.0070880.0061900.0114920.0095220.0166720.0141960.0113340.0039350.006956
2trainwrz1789011717890.0060100.0077240.0078710.0128680.0079070.0210390.006411...0.0059190.0070860.0061880.0114920.0095210.0166750.0141980.0113340.0039330.006953
3trainwrz1789012817890.0060150.0077280.0078740.0128670.0079100.0210250.006414...0.0059230.0070910.0061920.0114920.0095230.0166690.0141940.0113330.0039380.006957
4trainwrz1789020717890.0060180.0077310.0078800.0128650.0079140.0210100.006420...0.0059280.0070930.0061970.0114940.0095270.0166620.0141930.0113360.0039430.006963
..................................................................
647trainwrz1799112717990.0059570.0076800.0078290.0128830.0078670.0212070.006362...0.0058670.0070380.0061370.0114870.0094970.0167590.0142290.0113260.0038760.006906
648trainwrz1799120417990.0059600.0076820.0078310.0128820.0078680.0211990.006364...0.0058690.0070400.0061400.0114870.0094980.0167550.0142270.0113260.0038790.006908
649trainwrz1799120717990.0059480.0076720.0078210.0128860.0078590.0212390.006352...0.0058570.0070290.0061280.0114850.0094930.0167750.0142350.0113240.0038650.006896
650trainwrz1799121117990.0059670.0076880.0078360.0128810.0078740.0211780.006370...0.0058760.0070470.0061460.0114870.0095010.0167440.0142230.0113270.0038860.006914
651trainwrz1799121417990.0059550.0076790.0078270.0128840.0078650.0212150.006359...0.0058650.0070360.0061350.0114850.0094950.0167630.0142300.0113250.0038730.006903
\n", + "

652 rows × 103 columns

\n", + "
" + ], + "text/plain": [ + " split manifest_id year 0 1 2 3 \\\n", + "0 train wrz17890107 1789 0.005998 0.007714 0.007860 0.012872 \n", + "1 train wrz17890114 1789 0.006012 0.007726 0.007873 0.012867 \n", + "2 train wrz17890117 1789 0.006010 0.007724 0.007871 0.012868 \n", + "3 train wrz17890128 1789 0.006015 0.007728 0.007874 0.012867 \n", + "4 train wrz17890207 1789 0.006018 0.007731 0.007880 0.012865 \n", + ".. ... ... ... ... ... ... ... \n", + "647 train wrz17991127 1799 0.005957 0.007680 0.007829 0.012883 \n", + "648 train wrz17991204 1799 0.005960 0.007682 0.007831 0.012882 \n", + "649 train wrz17991207 1799 0.005948 0.007672 0.007821 0.012886 \n", + "650 train wrz17991211 1799 0.005967 0.007688 0.007836 0.012881 \n", + "651 train wrz17991214 1799 0.005955 0.007679 0.007827 0.012884 \n", + "\n", + " 4 5 6 ... 90 91 92 \\\n", + "0 0.007897 0.021079 0.006398 ... 0.005906 0.007075 0.006176 \n", + "1 0.007909 0.021033 0.006413 ... 0.005921 0.007088 0.006190 \n", + "2 0.007907 0.021039 0.006411 ... 0.005919 0.007086 0.006188 \n", + "3 0.007910 0.021025 0.006414 ... 0.005923 0.007091 0.006192 \n", + "4 0.007914 0.021010 0.006420 ... 0.005928 0.007093 0.006197 \n", + ".. ... ... ... ... ... ... ... \n", + "647 0.007867 0.021207 0.006362 ... 0.005867 0.007038 0.006137 \n", + "648 0.007868 0.021199 0.006364 ... 0.005869 0.007040 0.006140 \n", + "649 0.007859 0.021239 0.006352 ... 0.005857 0.007029 0.006128 \n", + "650 0.007874 0.021178 0.006370 ... 0.005876 0.007047 0.006146 \n", + "651 0.007865 0.021215 0.006359 ... 0.005865 0.007036 0.006135 \n", + "\n", + " 93 94 95 96 97 98 99 \n", + "0 0.011490 0.009515 0.016696 0.014205 0.011331 0.003919 0.006941 \n", + "1 0.011492 0.009522 0.016672 0.014196 0.011334 0.003935 0.006956 \n", + "2 0.011492 0.009521 0.016675 0.014198 0.011334 0.003933 0.006953 \n", + "3 0.011492 0.009523 0.016669 0.014194 0.011333 0.003938 0.006957 \n", + "4 0.011494 0.009527 0.016662 0.014193 0.011336 0.003943 0.006963 \n", + ".. ... ... ... ... 
... ... ... \n", + "647 0.011487 0.009497 0.016759 0.014229 0.011326 0.003876 0.006906 \n", + "648 0.011487 0.009498 0.016755 0.014227 0.011326 0.003879 0.006908 \n", + "649 0.011485 0.009493 0.016775 0.014235 0.011324 0.003865 0.006896 \n", + "650 0.011487 0.009501 0.016744 0.014223 0.011327 0.003886 0.006914 \n", + "651 0.011485 0.009495 0.016763 0.014230 0.011325 0.003873 0.006903 \n", + "\n", + "[652 rows x 103 columns]" + ] + }, + "execution_count": 277, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_top_doc_mat" + ] + }, + { + "cell_type": "code", + "execution_count": 278, + "id": "3d1161e4-da16-4908-9084-dda1d04f8bb1", + "metadata": {}, + "outputs": [], + "source": [ + "df_top_doc_mat['year'] = df_top_doc_mat['year'].astype(str)" + ] + }, + { + "cell_type": "code", + "execution_count": 279, + "id": "35d3d86b-0e24-4dbc-96c2-27607f62298c", + "metadata": {}, + "outputs": [], + "source": [ + "df_melted = df_top_doc_mat.melt(id_vars = ['split', 'manifest_id', 'year'], var_name = 'topics', value_name = 'values')" + ] + }, + { + "cell_type": "code", + "execution_count": 280, + "id": "e0f85447-7566-4dba-85c6-9254cee185b2", + "metadata": {}, + "outputs": [], + "source": [ + "df_melted['topics'] = df_melted['topics'].astype(str)" + ] + }, + { + "cell_type": "code", + "execution_count": 281, + "id": "421a02af-9bd8-4e79-9671-89fb2b56a917", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1793 7000\n", + "1795 7000\n", + "1791 6500\n", + "1790 6400\n", + "1792 6300\n", + "1794 6100\n", + "1796 6100\n", + "1798 6100\n", + "1797 5500\n", + "1789 5100\n", + "1799 3100\n", + "Name: year, dtype: int64" + ] + }, + "execution_count": 281, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_melted['year'].value_counts()" + ] + }, + { + "cell_type": "code", + "execution_count": 282, + "id": "8c0e699d-6f02-438f-97fe-7f27463fcb83", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
splitmanifest_idyeartopicsvalues
0trainwrz17890107178900.005998
1trainwrz17890114178900.006012
2trainwrz17890117178900.006010
3trainwrz17890128178900.006015
4trainwrz17890207178900.006018
..................
65195trainwrz179911271799990.006906
65196trainwrz179912041799990.006908
65197trainwrz179912071799990.006896
65198trainwrz179912111799990.006914
65199trainwrz179912141799990.006903
\n", + "

65200 rows × 5 columns

\n", + "
" + ], + "text/plain": [ + " split manifest_id year topics values\n", + "0 train wrz17890107 1789 0 0.005998\n", + "1 train wrz17890114 1789 0 0.006012\n", + "2 train wrz17890117 1789 0 0.006010\n", + "3 train wrz17890128 1789 0 0.006015\n", + "4 train wrz17890207 1789 0 0.006018\n", + "... ... ... ... ... ...\n", + "65195 train wrz17991127 1799 99 0.006906\n", + "65196 train wrz17991204 1799 99 0.006908\n", + "65197 train wrz17991207 1799 99 0.006896\n", + "65198 train wrz17991211 1799 99 0.006914\n", + "65199 train wrz17991214 1799 99 0.006903\n", + "\n", + "[65200 rows x 5 columns]" + ] + }, + "execution_count": 282, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_melted" + ] + }, + { + "cell_type": "code", + "execution_count": 283, + "id": "6b203d91-1c6f-43b4-b550-323c01b29446", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:436: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " scout, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing 
numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use 
Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support 
for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases 
later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support 
for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases 
later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support 
for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases 
later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support 
for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases 
later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support 
for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:514: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " line, = ax.plot([], [], **kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 
and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be 
removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor 
releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use 
Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units 
instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = 
func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, 
**use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + 
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\relational.py:337: MatplotlibDeprecationWarning: Support for passing numbers through unit converters is deprecated since 3.5 and support will be removed two minor releases later; use Axis.convert_units instead.\n", + " artist = func([], [], label=label, **use_kws)\n" + ] + }, + { + "data": { + 
"text/plain": [ + "" + ] + }, + "execution_count": 283, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "sns.lineplot(data=df_melted, x=\"year\", y=\"values\", hue = 'topics')\n", + "plt.legend(bbox_to_anchor=(1.05, 1), loc=2, borderaxespad=0.)" + ] + }, + { + "cell_type": "code", + "execution_count": 284, + "id": "fdce078c-6deb-4d72-921d-bdc007e98366", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 284, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "sns.violinplot(x=\"topics\", y=\"values\", data=df_melted, scale=\"count\")" + ] + }, + { + "cell_type": "code", + "execution_count": 289, + "id": "34c60c35-05a3-4e5e-b854-e5efebf7f6de", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.02157101" + ] + }, + "execution_count": 289, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "max(map(lambda x: x[50], model_output['topic-document-matrix']))" + ] + }, + { + "cell_type": "code", + "execution_count": 286, + "id": "8f98529c-35fd-4e04-bc96-bbf73c7eb300", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.021952521055936813" + ] + }, + "execution_count": 286, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "max(df_melted['values'])" + ] + }, + { + "cell_type": "code", + "execution_count": 287, + "id": "3b1612e9-6610-4b81-8cda-38abbac3271c", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 287, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAXAAAAEGCAYAAAB8Ys7jAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAAMZ0lEQVR4nO3db4xl9V3H8c+PXQpLY8UWirhUV1y1KVVRN0QTq7FqrBiDkURBoxJjKqluNiZ9oKlGTUysD6qFxdhgoqEmWmqNif3DA2NKtImCu7LQNgU7LFZ3W5CWtJYuBUt/Pjhn2LvD/IWZe+53+nolm52995x7vnv2N++5e+78ab33AFDPeVMPAMALI+AARQk4QFECDlCUgAMUtXcrG19yySX9wIEDOzQKwO50/PjxT/feL93ux91SwA8cOJBjx45t9wwAu1pr7RM78bguoQAUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFFb+pmYnOvo0aNZWlqaeoxtd/r06STJ/v37J57kK8PBgwdz+PDhqcegIAF/EZaWlnLiIx/Lsxe9fOpRttWeM59Lkjz6tOWx0/aceWLqESjMe+iL9OxFL89Tr7526jG21b4HP5Aku+7vtYiWzzW8EK6BAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABFCThAUQIOUJSAAxQ1l4AfPXo0R48encehALbVIvdr7zwOsrS0NI/DAGy7Re6XSygARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARe2dx0FOnz6dp556KkeOHJnH4eZmaWkp5z3Tpx6Dws774v9maenzu+59YzdZWlrKvn37ph5jVRs+A2+tvbG1dqy1duzxxx+fx0wAbMKGz8B777cnuT1JDh069IKebu7fvz9Jcsstt7yQ3RfWkSNHcvzkY1OPQWFfvvBlOXjlZbvufWM3WeT/HbkGDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUJeAARQk4QFECDlCUgAMUtXceBzl48OA8DgOw7Ra5X3MJ+OHDh+dxGIBtt8j9cgkFoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAogQcoCgBByhKwAGKEnCAovZOPUB1e848kX0PfmDqMbbVnjOfSZJd9/daRHvOPJHksqnHoCgBfxEOHjw49Qg74vTpLyVJ9u8Xlp132a5dR+w8AX8RDh8+PPUIwFcw18ABihJwgKIEHKAoAQcoSsABihJwgKIEHKAoAQcoSsABihJwgKIEHKAoAQcoSsABihJwgKIEHKAoAQcoSsABihJwgKIEHKAoAQcoqvXeN79xa48n+cQOzXJJkk/
v0GNvN7PunErzmnXnVJp3M7N+Q+/90u0+8JYCvpNaa8d674emnmMzzLpzKs1r1p1Tad4pZ3UJBaAoAQcoapECfvvUA2yBWXdOpXnNunMqzTvZrAtzDRyArVmkZ+AAbIGAA1TVe9/0ryRvSPJQkqUkv7HK/S3JreP9DyT5ro32TfK7SU4nOTH+unbmvt8ct38oyY+Ot33VzLYnMnz+5dvH+25K8vjMfX88r3mTvCLJB5M8meS2Fcf57iQfHh/r1py9dHVBkjvH2x9M8vCUsya5KMn7x1k+muStM/fNntuHkzy6AOf17vGxlvd55Srn9Z4kvzj1Osjm1+08z+2PJDmeYW0eT/L6BV6zq86aza/ZE5lvD9Y7t3dnc+v2wIZN3kK894z/WFcmeUmS+5O8ZsU21ya5azwR35Pkno32HU/Am1c53mvG7S5I8o3j/ntW2e54ku+f+Qe7baJ5X5rk+5LcnOeH5t4k3zse564kPzbe/qYk7xiP91iS9005a4Z3hh8c335Jkn+emfWmJLct2Hm9O8mhVfZ5U5J3jG/fmCGmk8+70bqd4Nx+Z5KvG99+bZLTC7xmV501m1izE/VgvXN7dzZetzckuXOjLm/lEso1SZZ67yd7788keVeS61Zsc12Sd/bBvya5uLV2+Sb3Xem6JO/qvT/de38kw0ela2Y3aK19c5JXZvhHm3Te3vsXeu8fSvLFFTNenuRlvfd/6cO/zDuT/OTM8e8Yj3d/hkXzf1PN2ns/03v/4Pj2M0n+PckVK3ZfiPO6geXzmiT/neGd7pFFmXeddTvvc3tf7/2T4x8/muTC1toFC7pmV511k2s2mzzmjs+73j45d92+J8kPtdbaejtsJeD7M7wzLDs13raZbTba99daaw+01v68tfY1WzjejRk+SvWZ265vrT2Q5I+SPDHHedeyf9x/tcdaPs7+JP+V5HMZ/gs+1azPaa1dnOQnkvzjzM3XZ1i839Jae9Uax5v3rH/RWjvRWvvtmcU+e5yvzRDTVyzIvMka6zbTntvrk9zXe386i79mZ2d9zlprdgF6sNq8667b3vuXcvbcrmkrAV/tI0Hf5Dbr7funSb4pydVJPpXkbVs43g1J/nrmz+/NcN3o2zNce/qBOc67lvUeq62yTV/x+zxnHQ7U2t4M5/XW3vvJ8eb3JjmQ5M0ZrvndMbPLVLP+XO/925K8bvz186scf/nt2RknO7ejVddtJjq3rbWrkvxhkl/Z4Biz902yZleZdfn2NdfslD1YY97NrNu1ZjzHVgJ+KsmrZv58RZJPbnKbNfftvT/We3+29/7lJH+Ws5dJ1j1ea+07kuztvR9fvq33/pmZj3J3JLl0rf13YN61nMq5/6WbnWP5OKeSfH2Sr87wLGGqWZfdnuTjvfe3L98wc25PJflChhe5Vv595jpr7/30+Pvnk/xVVl87n0pyYc4++5r03G6wbud+bltrVyT5uyS/0Ht/eOYYC7dm15h12XprNpmgB2vNu5l1O35AWj63a+sbXCTvZy+w701yMsMLissX8q9asc2P59wXAe7daN8kl8/s/+sZrnsnyVU590XMk5l5ETPJW5P83orjzz7W9Rn+6zyXeWduuynPf7Ht38bHX35BaPmV6l/N8ILQ3gwvCL1/AWb9/SR/m+S81c7teLxHk9w35azjY10yvn1+hmuGN8+e1/Htn83wIubk62CjdTvvc5vk4nG761eZc6HW7Aazrrtmp+jBWvNm8+v2hiTvXq3F5zzeRhusOPi1Sf4jwyuybxlvu3lmgJbkT8b7P5yZV1pX23e8/S/HbR9I8vcrTshbxu0fyvjK8sx9J5O8esVtf5DhBYP7M3wq1xvnPO9/ZviI+WSGj6bLr1QfSvKR8bFuy9lPybowyd/k7KdKPjLlrBmeWfQkH8vZT3H65VXO7f0LMOtLM3wmxwPjXLdk/AC/4rzem+SXFmEdbHLdzu3cJvmtDM/4T+T5n9K2UGt2rVmz+TU71x6sM+9W1u2
VGzXZl9IDFOUrMQGKEnCAogQcoCgBByhKwAGK2jv1ALAVrbULk/xThq8P2JvkPb3332mt3ZnkW8fNLk7y2d771ZMMCXMi4FTzdIZvzflka+38JB9qrd3Ve/+Z5Q1aa2/L8H0kYFcTcErpwxcuPDn+8fzx13NfzDB+Y6CfTvL6+U8H8+UaOOW01va01k4k+Z8k/9B7v2fm7tcleaz3/vFJhoM5EnDK6cM3D7o6w5dRX9Nae+3M3Tfm3O/0B7uWgFNW7/2zGX66yRuS576D209l+LFUsOsJOKW01i4dv3F/Wmv7kvxwhp+HmOW3e++n1tgddhUvYlLN5UnuaK3tyfAE5N299/eN9638QQmwq/luhABFuYQCUJSAAxQl4ABFCThAUQIOUJSAAxQl4ABF/T/++rads8DkpwAAAABJRU5ErkJggg==\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "sns.boxplot(df_top_doc_mat.iloc[:, 40])" + ] + }, + { + "cell_type": "code", + "execution_count": 288, + "id": "0673ffa7-b81a-4de8-8064-ff366b40eebe", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\axisgrid.py:130: DeprecationWarning: distutils Version classes are deprecated. Use packaging.version instead.\n", + " if LooseVersion(mpl.__version__) < LooseVersion(\"3.0\"):\n", + "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\seaborn\\axisgrid.py:130: DeprecationWarning: distutils Version classes are deprecated. Use packaging.version instead.\n", + " if LooseVersion(mpl.__version__) < LooseVersion(\"3.0\"):\n" + ] + }, + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 288, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "sns.displot(x = df_melted['year'], y = df_melted['values'], hue = df_melted['topics'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9f4ed94a-93be-448f-b48b-f6f15769869d", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "b2fbeae5-9e38-4365-a20e-6dcf1a30eaed", + "metadata": {}, + "source": [ + "

model optimisation

" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "bffa6694-19c3-4f4a-9167-76dc6dd9f70d", + "metadata": {}, + "outputs": [], + "source": [ + "from skopt.space.space import Real, Categorical, Integer\n", + "from octis.evaluation_metrics.coherence_metrics import Coherence\n", + "from octis.optimization.optimizer import Optimizer\n", + "from octis.evaluation_metrics.diversity_metrics import TopicDiversity" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "a54b82da-f6df-4944-933c-6ad1d082c7e0", + "metadata": {}, + "outputs": [], + "source": [ + "search_space = {\"t_hidden_size\": Categorical({700, 1000, 1300})}#, \n", + " #\"num_epochs\": Categorical({100, 150, 200}),\n", + " #\"dropout\": Real(0.0, 0.95)}" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "b43500c2-92f2-4e99-8d4c-fe3523229e9d", + "metadata": {}, + "outputs": [], + "source": [ + "coherence = Coherence(texts=dataset.get_corpus(), measure = 'c_v')" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "598461a0-9ea3-4502-9f53-7046de154924", + "metadata": {}, + "outputs": [], + "source": [ + "optimization_runs=15" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "216a66e0-ae73-4186-b643-13e7b7479410", + "metadata": {}, + "outputs": [], + "source": [ + "model_runs=5" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "id": "022bc79a-cad6-4d65-9139-9e26901077c0", + "metadata": {}, + "outputs": [], + "source": [ + "optimizer=Optimizer()\n", + "import time\n", + "start = time.time()\n", + "optimization_result = optimizer.optimize(\n", + " model, dataset, coherence, search_space, number_of_call=optimization_runs, \n", + " model_runs=model_runs, save_models=True, \n", + " extra_metrics=None, # to keep track of other metrics\n", + " save_path='results/test_ETMco1_wz//')\n", + "end = time.time()\n", + "duration = end - start\n", + "optimization_result.save_to_csv(\"results_ETMco1_wz.csv\")\n", + 
"print('Optimizing model took: ' + str(round(duration)) + ' seconds.')" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "4494c763-6801-4146-a2df-aa7b4871bed2", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "dict_keys(['dataset_name', 'dataset_path', 'is_cached', 'kernel', 'acq_func', 'surrogate_model', 'optimization_type', 'model_runs', 'save_models', 'save_step', 'save_name', 'save_path', 'early_stop', 'early_step', 'plot_model', 'plot_best_seen', 'plot_name', 'log_scale_plot', 'search_space', 'model_name', 'model_attributes', 'use_partitioning', 'metric_name', 'extra_metric_names', 'metric_attributes', 'extra_metric_attributes', 'current_call', 'number_of_call', 'random_state', 'x0', 'y0', 'n_random_starts', 'initial_point_generator', 'topk', 'time_eval', 'dict_model_runs', 'f_val', 'x_iters'])" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "import json\n", + "results = json.load(open('results/test_ETMco1_wz/result.json','r'))\n", + "results.keys()" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "54d16953-b086-4ef1-a95d-48da42d336f0", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "plt.xlabel('Iteration')\n", + "plt.ylabel('Coherence score (c_v)')\n", + "plt.title('Median coherence score per iteration')\n", + "plt.plot(results['f_val'])\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "5968ac38-254e-4b27-8397-f3a77f2a370b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "2" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "results[ 'f_val'].index(max(results[ 'f_val']))" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "id": "4077e429-892f-4f20-9281-c42ae03f2ab3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.25312598515861223" + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "results[\"f_val\"][2]" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "08daea25-8827-4ed6-aae8-920c1a11d315", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "dict_keys(['t_hidden_size'])" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "results['x_iters'].keys()" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "id": "e00e8ae9-1a08-40ee-80ff-3a030ffd0f1d", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[700]\n" + ] + } + ], + "source": [ + "print([results['x_iters'][parameter][10] for parameter in results['x_iters'].keys()])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "45e18e12-127e-402f-b30a-5871f0b32036", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 24, + "id": "c9b45fa3-ba30-4f8f-9a5f-2879c7d42861", + "metadata": {}, + "outputs": [], + 
"source": [ + "model = ETM(num_topics=100, num_epochs=150, t_hidden_size=700, rho_size=600,\n", + "embedding_size=800, activation='relu', dropout=0.1, lr=0.005,\n", + "optimizer='adam', batch_size=128, clip=0.0, wdecay=1.2e-06, bow_norm=1,\n", + "device='cpu', top_word=25, train_embeddings=True, embeddings_path=None,\n", + "embeddings_type='pickle', binary_embeddings=True,\n", + "headerless_embeddings=False, use_partitions=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "id": "8679676b-5888-48b6-aa88-238ccd5b9ab5", + "metadata": {}, + "outputs": [], + "source": [ + "search_space = {\"rho_size\": Categorical({500, 600, 700, 800})}#, \n", + " #\"num_epochs\": Categorical({100, 150, 200}),\n", + " #\"dropout\": Real(0.0, 0.95)}" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "id": "134f969e-cc0e-4230-a15b-62025b9f6a8b", + "metadata": {}, + "outputs": [], + "source": [ + "optimization_runs=15" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "id": "b219d52f-a511-4958-a725-54dc69e4576f", + "metadata": {}, + "outputs": [], + "source": [ + "model_runs=5" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "id": "1c988bee-6260-4270-a5a8-ed0b6214e841", + "metadata": {}, + "outputs": [], + "source": [ + "optimizer=Optimizer()\n", + "import time\n", + "start = time.time()\n", + "optimization_result = optimizer.optimize(\n", + " model, dataset, coherence, search_space, number_of_call=optimization_runs, \n", + " model_runs=model_runs, save_models=True, \n", + " extra_metrics=None, # to keep track of other metrics\n", + " save_path='results/test_ETMco2_wz//')\n", + "end = time.time()\n", + "duration = end - start\n", + "optimization_result.save_to_csv(\"results_ETMdco2_wz.csv\")\n", + "print('Optimizing model took: ' + str(round(duration)) + ' seconds.')" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "id": "e627582f-8a16-46cb-a99c-b63905bc7a77", + "metadata": {}, + "outputs": [ + { + "data": { + 
"text/plain": [ + "dict_keys(['dataset_name', 'dataset_path', 'is_cached', 'kernel', 'acq_func', 'surrogate_model', 'optimization_type', 'model_runs', 'save_models', 'save_step', 'save_name', 'save_path', 'early_stop', 'early_step', 'plot_model', 'plot_best_seen', 'plot_name', 'log_scale_plot', 'search_space', 'model_name', 'model_attributes', 'use_partitioning', 'metric_name', 'extra_metric_names', 'metric_attributes', 'extra_metric_attributes', 'current_call', 'number_of_call', 'random_state', 'x0', 'y0', 'n_random_starts', 'initial_point_generator', 'topk', 'time_eval', 'dict_model_runs', 'f_val', 'x_iters'])" + ] + }, + "execution_count": 32, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "import json\n", + "results = json.load(open('results/test_ETMco2_wz/result.json','r'))\n", + "results.keys()" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "id": "6b6921cd-7dcb-46fc-8561-dd4aa2cf4b8d", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[600]\n" + ] + } + ], + "source": [ + "print([results['x_iters'][parameter][10] for parameter in results['x_iters'].keys()])" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "78505c00-7a78-45a0-9b2b-f15c18a02200", + "metadata": {}, + "outputs": [], + "source": [ + "model = ETM(num_topics=100, num_epochs=150, t_hidden_size=700, rho_size=500,\n", + "embedding_size=600, activation='relu', dropout=0.1, lr=0.005,\n", + "optimizer='adam', batch_size=128, clip=0.0, wdecay=1.2e-06, bow_norm=1,\n", + "device='cpu', top_word=25, train_embeddings=True, embeddings_path=None,\n", + "embeddings_type='pickle', binary_embeddings=True,\n", + "headerless_embeddings=False, use_partitions=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "b8b9bdba-d331-4918-8315-62df6327c75a", + "metadata": {}, + "outputs": [], + "source": [ + "search_space = {\"embedding_size\": Categorical({700, 800, 900, 1000})}#, \n", + " 
#\"num_epochs\": Categorical({100, 150, 200}),\n", + " #\"dropout\": Real(0.0, 0.95)}" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "b031e385-199f-4ff5-a546-51b6c195fe2a", + "metadata": {}, + "outputs": [], + "source": [ + "optimization_runs=15" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "25bf9566-1d12-48c5-9e87-f6df819585dc", + "metadata": {}, + "outputs": [], + "source": [ + "model_runs = 5" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "id": "1c574ddd-557d-43f3-b6d9-53f0ed284c41", + "metadata": {}, + "outputs": [], + "source": [ + "optimizer=Optimizer()\n", + "import time\n", + "start = time.time()\n", + "optimization_result = optimizer.optimize(\n", + " model, dataset, topic_diversity, search_space, number_of_call=optimization_runs, \n", + " model_runs=model_runs, save_models=True, \n", + " extra_metrics=None, # to keep track of other metrics\n", + " save_path='results/test_ETMco3_wz//')\n", + "end = time.time()\n", + "duration = end - start\n", + "optimization_result.save_to_csv(\"results_ETMco3_wz.csv\")\n", + "print('Optimizing model took: ' + str(round(duration)) + ' seconds.')" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "ed4fb6a3-49a1-44c2-a3e7-0e03d90daf32", + "metadata": {}, + "outputs": [], + "source": [ + "import json" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "40086dfb-11ae-4680-afcf-19e7fe6a7725", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "dict_keys(['dataset_name', 'dataset_path', 'is_cached', 'kernel', 'acq_func', 'surrogate_model', 'optimization_type', 'model_runs', 'save_models', 'save_step', 'save_name', 'save_path', 'early_stop', 'early_step', 'plot_model', 'plot_best_seen', 'plot_name', 'log_scale_plot', 'search_space', 'model_name', 'model_attributes', 'use_partitioning', 'metric_name', 'extra_metric_names', 'metric_attributes', 'extra_metric_attributes', 'current_call', 'number_of_call', 
'random_state', 'x0', 'y0', 'n_random_starts', 'initial_point_generator', 'topk', 'time_eval', 'dict_model_runs', 'f_val', 'x_iters'])" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "results = json.load(open('results/test_ETMco3_wz/result.json','r'))\n", + "results.keys()" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "25b4f43d-6437-4a1c-bbf6-1b795496505c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[800]\n" + ] + } + ], + "source": [ + "print([results['x_iters'][parameter][10] for parameter in results['x_iters'].keys()])" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "id": "bd504b2f-aaad-480a-8a56-c6099534b2d2", + "metadata": {}, + "outputs": [], + "source": [ + "model = ETM(num_topics=100, num_epochs=150, t_hidden_size=700, rho_size=500,\n", + "embedding_size=800, activation='relu', dropout=0.1, lr=0.005,\n", + "optimizer='adam', batch_size=128, clip=0.0, wdecay=1.2e-06, bow_norm=1,\n", + "device='cpu', top_word=25, train_embeddings=True, embeddings_path=None,\n", + "embeddings_type='pickle', binary_embeddings=True,\n", + "headerless_embeddings=False, use_partitions=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "id": "ac0fe1f8-6b83-4c37-a345-4006ed70716f", + "metadata": {}, + "outputs": [], + "source": [ + "search_space = {\"num_topics\": Integer(80,160)}" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "id": "bc4ed882-ebd5-4276-b99d-549b92f3d68a", + "metadata": {}, + "outputs": [], + "source": [ + "topic_diversity = TopicDiversity(topk=10)" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "id": "2931284e-c71f-45c3-806f-bcdaa3f910a4", + "metadata": {}, + "outputs": [], + "source": [ + "optimization_runs=15" + ] + }, + { + "cell_type": "code", + "execution_count": 38, + "id": "cadbcee7-5d87-44dd-9b60-bcd0fa23a4d4", + "metadata": {}, + "outputs": [], + 
"source": [ + "model_runs = 5" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "id": "733a718d-04f9-49c9-a40e-95ee75a6aa4d", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Current call: 0\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=119, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.44 .. Rec_loss: 88997.65 .. NELBO: 89001.09\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=119, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.14 .. Rec_loss: 88974.47 .. NELBO: 88975.61\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=119, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.13 .. Rec_loss: 89034.72 .. NELBO: 89036.85\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=119, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.08 .. Rec_loss: 89023.43 .. NELBO: 89025.51\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=119, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=119, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.67 .. Rec_loss: 88995.5 .. NELBO: 88998.17\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 1\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=127, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.84 .. Rec_loss: 89054.54 .. NELBO: 89056.38\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=127, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.32 .. Rec_loss: 89029.5 .. NELBO: 89031.82\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=127, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.08 .. Rec_loss: 89003.84 .. NELBO: 89006.92\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=127, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.13 .. Rec_loss: 88993.01 .. NELBO: 88996.14\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=127, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=127, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.7 .. Rec_loss: 88999.83 .. NELBO: 89002.53\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 2\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 4.27 .. Rec_loss: 88988.58 .. NELBO: 88992.85\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.89 .. Rec_loss: 88973.64 .. NELBO: 88976.53\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.01 .. Rec_loss: 89013.17 .. NELBO: 89015.18\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.7 .. Rec_loss: 89004.62 .. NELBO: 89008.32\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.54 .. Rec_loss: 88993.82 .. NELBO: 88995.36\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 3\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=109, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.83 .. Rec_loss: 88979.26 .. NELBO: 88982.09\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=109, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.13 .. Rec_loss: 89005.84 .. NELBO: 89007.97\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=109, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.97 .. Rec_loss: 89006.06 .. NELBO: 89009.03\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=109, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.08 .. Rec_loss: 89030.16 .. NELBO: 89032.24\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=109, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=109, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.26 .. Rec_loss: 89038.32 .. NELBO: 89040.58\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 4\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=108, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.79 .. Rec_loss: 89004.0 .. NELBO: 89005.79\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=108, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.98 .. Rec_loss: 89015.57 .. NELBO: 89017.55\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=108, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.83 .. Rec_loss: 88991.01 .. NELBO: 88992.84\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=108, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.57 .. Rec_loss: 88979.58 .. NELBO: 88981.15\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=108, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=108, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.43 .. Rec_loss: 88980.47 .. NELBO: 88982.9\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 5\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.81 .. Rec_loss: 88983.06 .. NELBO: 88985.87\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.66 .. Rec_loss: 89006.57 .. NELBO: 89008.23\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.65 .. Rec_loss: 88995.69 .. NELBO: 88999.34\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.8 .. Rec_loss: 88953.95 .. NELBO: 88956.75\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.33 .. Rec_loss: 88986.86 .. NELBO: 88988.19\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 6\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.78 .. Rec_loss: 88949.98 .. NELBO: 88952.76\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.57 .. Rec_loss: 88974.0 .. NELBO: 88976.57\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.98 .. Rec_loss: 88970.07 .. NELBO: 88973.05\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.5 .. Rec_loss: 88964.56 .. NELBO: 88967.06\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.45 .. Rec_loss: 89007.67 .. NELBO: 89009.12\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 7\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.6 .. Rec_loss: 89012.43 .. NELBO: 89016.03\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.19 .. Rec_loss: 88987.99 .. NELBO: 88989.18\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.23 .. Rec_loss: 88985.48 .. NELBO: 88986.71\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.28 .. Rec_loss: 88962.42 .. NELBO: 88964.7\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=90, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=90, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.86 .. Rec_loss: 88984.61 .. NELBO: 88986.47\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 8\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=82, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.74 .. Rec_loss: 88987.9 .. NELBO: 88989.64\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=82, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.34 .. Rec_loss: 88971.59 .. NELBO: 88972.93\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=82, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.46 .. Rec_loss: 88964.02 .. NELBO: 88967.48\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=82, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 4.33 .. Rec_loss: 88984.25 .. NELBO: 88988.58\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=82, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=82, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.5 .. Rec_loss: 88975.72 .. NELBO: 88979.22\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 9\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.36 .. Rec_loss: 88991.34 .. NELBO: 88994.7\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.03 .. Rec_loss: 89034.76 .. NELBO: 89036.79\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 4.13 .. Rec_loss: 88979.65 .. NELBO: 88983.78\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.25 .. Rec_loss: 89011.82 .. NELBO: 89014.07\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.25 .. Rec_loss: 89034.11 .. NELBO: 89037.36\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 10\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=102, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.07 .. Rec_loss: 88982.92 .. NELBO: 88985.99\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=102, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.02 .. Rec_loss: 88984.46 .. NELBO: 88987.48\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=102, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.26 .. Rec_loss: 89017.67 .. NELBO: 89018.93\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=102, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.61 .. Rec_loss: 88957.25 .. NELBO: 88960.86\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=102, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=102, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.86 .. Rec_loss: 88975.86 .. NELBO: 88977.72\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 11\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.52 .. Rec_loss: 89025.5 .. NELBO: 89028.02\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.84 .. Rec_loss: 88987.69 .. NELBO: 88989.53\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.72 .. Rec_loss: 88987.53 .. NELBO: 88990.25\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.62 .. Rec_loss: 88963.97 .. NELBO: 88965.59\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.44 .. Rec_loss: 89019.76 .. NELBO: 89022.2\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 12\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=104, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.75 .. Rec_loss: 88980.13 .. NELBO: 88981.88\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=104, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.32 .. Rec_loss: 89002.83 .. NELBO: 89005.15\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=104, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.44 .. Rec_loss: 89004.85 .. NELBO: 89007.29\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=104, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.13 .. Rec_loss: 88975.44 .. NELBO: 88978.57\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=104, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=104, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.79 .. Rec_loss: 89020.73 .. NELBO: 89022.52\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 13\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.11 .. Rec_loss: 89009.93 .. NELBO: 89011.04\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.0 .. Rec_loss: 88963.22 .. NELBO: 88966.22\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.15 .. Rec_loss: 88989.65 .. NELBO: 88991.8\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.13 .. Rec_loss: 88987.96 .. NELBO: 88990.09\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=103, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=103, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 1.75 .. Rec_loss: 88986.13 .. NELBO: 88987.88\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Current call: 14\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=101, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.17 .. Rec_loss: 89048.06 .. NELBO: 89050.23\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=101, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.89 .. Rec_loss: 88974.84 .. NELBO: 88978.73\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=101, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.58 .. Rec_loss: 88997.39 .. NELBO: 88999.97\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=101, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 2.53 .. Rec_loss: 88971.39 .. NELBO: 88973.92\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=101, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=101, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.58 .. Rec_loss: 89000.65 .. NELBO: 89004.23\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n", + "Optimizing model took: 4109 seconds.\n" + ] + } + ], + "source": [ + "optimizer=Optimizer()\n", + "import time\n", + "start = time.time()\n", + "optimization_result = optimizer.optimize(\n", + " model, dataset, topic_diversity, search_space, number_of_call=optimization_runs, \n", + " model_runs=model_runs, save_models=True, \n", + " extra_metrics=None, # to keep track of other metrics\n", + " save_path='results/test_ETMco5_wz//')\n", + "end = time.time()\n", + "duration = end - start\n", + "optimization_result.save_to_csv(\"results_ETMco5_wz.csv\")\n", + "print('Optimizing model took: ' + str(round(duration)) + ' seconds.')" + ] + }, + { + "cell_type": "code", + "execution_count": 40, + "id": "012b1e5d-ab2c-4af2-825f-35ec4ba36584", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "dict_keys(['dataset_name', 'dataset_path', 'is_cached', 'kernel', 'acq_func', 'surrogate_model', 'optimization_type', 'model_runs', 'save_models', 'save_step', 'save_name', 'save_path', 'early_stop', 'early_step', 'plot_model', 'plot_best_seen', 'plot_name', 'log_scale_plot', 'search_space', 'model_name', 'model_attributes', 'use_partitioning', 'metric_name', 'extra_metric_names', 'metric_attributes', 'extra_metric_attributes', 'current_call', 'number_of_call', 'random_state', 'x0', 'y0', 'n_random_starts', 'initial_point_generator', 'topk', 'time_eval', 'dict_model_runs', 'f_val', 'x_iters'])" + ] + }, + "execution_count": 40, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "results = json.load(open('results/test_ETMco5_wz/result.json','r'))\n", + "results.keys()" + ] + }, + { + "cell_type": "code", + "execution_count": 41, + "id": "88f05c2d-a055-4d36-840e-5fee027979c1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[119, 127, 99, 109, 108, 90, 99, 90, 82, 103, 
102, 103, 104, 103, 101]]\n" + ] + } + ], + "source": [ + "print([results['x_iters'][parameter] for parameter in results['x_iters'].keys()])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f4b0c8d1-c91f-42f8-afd7-0664274daf1d", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "9392cba6-9bd4-44a4-92d2-c047ba4c9b16", + "metadata": {}, + "source": [ + "

final model

" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "dbb3e9ba-4767-4cf1-b626-847483c50650", + "metadata": {}, + "outputs": [], + "source": [ + "model = ETM(num_topics=99, num_epochs=150, t_hidden_size=700, rho_size=500,\n", + "embedding_size=800, activation='relu', dropout=0.1, lr=0.005,\n", + "optimizer='adam', batch_size=128, clip=0.0, wdecay=1.2e-06, bow_norm=1,\n", + "device='cpu', top_word=25, train_embeddings=True, embeddings_path=None,\n", + "embeddings_type='pickle', binary_embeddings=True,\n", + "headerless_embeddings=False, use_partitions=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "98b21d15-25bd-43ae-b359-1b045324b806", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "model: ETM(\n", + " (t_drop): Dropout(p=0.1, inplace=False)\n", + " (theta_act): ReLU()\n", + " (rho): Linear(in_features=500, out_features=118936, bias=False)\n", + " (alphas): Linear(in_features=500, out_features=99, bias=False)\n", + " (q_theta): Sequential(\n", + " (0): Linear(in_features=118936, out_features=700, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=700, out_features=700, bias=True)\n", + " (3): ReLU()\n", + " )\n", + " (mu_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + " (logsigma_q_theta): Linear(in_features=700, out_features=99, bias=True)\n", + ")\n", + "****************************************************************************************************\n", + "Epoch----->1 .. LR: 0.005 .. KL_theta: 3.03 .. Rec_loss: 88965.19 .. NELBO: 88968.22\n", + "****************************************************************************************************\n", + "****************************************************************************************************\n", + "VALIDATION .. LR: 0.005 .. KL_theta: nan .. Rec_loss: nan .. 
NELBO: nan\n", + "****************************************************************************************************\n" + ] + } + ], + "source": [ + "model_output = model.train_model(dataset)" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "c3e1e849-4243-4a21-8a3b-bb4d0fd330fc", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "stadt bestimmte find haus nürnberg nachm bekannt statten bringen besatzung\n", + "königreich gebäude beyden halb wenige besteht bringen bewegungen jahren befindlich\n", + "kung rechr namen königreich bestimmte bevollmächtig endlich pest wisse erlaubniß\n", + "wisse reichs beyden nürnberg haus rechtssache endlich genau bekannt schwere\n", + "gewisse stande hader besteht beyden laden herausgabe hauptstadt verkaufe begab\n", + "leute herrn langte jahren grund preise schmeichelt mauer erfolg lauten\n", + "rechr gewe amortisirung london oktober endlich werner dero bracht fche\n", + "gewisser platze preise wisse leute königreich gläubiger obbe berlin besteht\n", + "gemeldet grund vorbehalt christian besteht zeichen kommen zurück königreich welch\n", + "eingetroffen rich ersten herausgabe list hausmeister daselbst endlich obern melde\n", + "dienste genugsam höchste lass befehlen grund gewisser hader viele schau\n", + "daselbst grund wenige rechr erfahrung königreich begebenheiten mach wasser marquis\n", + "grund korps platze rechr vorge soldat königreich wesentlichen befinden gemeldet\n", + "diel leute schwere preise mehr erhält stand königreich gewe spielen\n", + "bekomme rechtssache macht seite halt last gottes spanien unserm brin\n", + "allerhand einzusehen brücke erlaubniß dörfer schwere rechr rechtssache viele geschehen\n", + "theils wahr gewe bewegungen getheilt wien angemeldet lung gast einzuberufen\n", + "rechr pfandrecht halb klage hader sothane bracht nich befind betreffende\n", + "pfandrecht verbinden hauptstadt beyden rechr bekannt karten haust kanone theils\n", + 
"rich bekannt derley agram gewe asse rechr inder gewisser nich\n", + "rechr langte kung endlich sagten gemeldet gestorben begebenheiten öffentlichen geständig\n", + "grund platze königreich verkauf wohnhaft endlich kanonen bitten thal wehr\n", + "konkurs rechr nachdem hätte hader besteht viele befehlen wasser frist\n", + "rechr kaum vorzuladen besteht pest mauer mona bringen gewisser erhält\n", + "bringen verstorbenen begebenheiten befehlen geschehen begab kohl befinden macher beyden\n", + "befinden namen geschätzt laden mittel haftet kohl erhebung nachfrage schaden\n", + "konkurs melden platze schicksal hiemtt abends geltend obstgarten bringen selb\n", + "endlich beständig reichs lass schuld london gemeldet wundarzt icit haust\n", + "stroh besteht wien pfandrecht best wann schiff königreich beyden grund\n", + "wann pest oktober nächste befehle schlesien künstler uche wasser gewe\n", + "diel lung mehr legt tags bald bitten eingetroffen befehle rechr\n", + "rechr grund ober wasser sothane spanien beyden theils verbinden kirche\n", + "stand vieles pfer halb hätte gege herausgabe daraus eingetroffen vergnügen\n", + "schau bringen find welch rechr nähern bald ichen derley gewe\n", + "leute pest wünsche rich monats schlesien lauten wasser band papiere\n", + "rechr rich frucht nich bringen melden bestehen obbe nahm verkauf\n", + "zurück rechr ober weiches gemacht königreich kanonen person rechtssache abgehalten\n", + "leute beyden bekannt vorzula stande pest großbritannien begebenheiten hilf bringen\n", + "sammeln dienste verstrichen seite rothen beyden hätte gewisser bedienen nachdem\n", + "grund hausmeister stein rechr daraus bekannt thomas haut gemeldet begebenheiten\n", + "rechr vorbehalt rufen schwarzen preise ergangen erst bereits klasse vergnügen\n", + "ausgenommen königreich besteht leute reichs sothane chre zugleich hiemtt gern\n", + "städte herausgabe lass gewe stande bald schau hauptstadt stunde langte\n", + "hielt gewisser endlich rechr ersten nähern wich 
erleichtern neubau schneidermeister\n", + "königreich leitung leute herrn kenntnisse eingetroffen letzter hader gemeldet london\n", + "rechr zumelden allgemein liquidiren find anverwandten mehr verkaufe bekannt wohnhaft\n", + "vertheidigung willigen pfandrecht gern ober ersten gemeldet langte erlaubniß daselbst\n", + "beyden rechr hauptstadt wann ausgenommen bringen mannschaft viele seite theils\n", + "haus verkaufe gewisser sieg schuld bezahlet verstorbenen handels zahlreiche bändchen\n", + "gewe ufer rechr leute vorgehen steh nachm aufsatz mündlich reichs\n", + "grund platze befinden rechr welch rechtssache verlangte schuld scher hätte\n", + "bringen beyden begebenheiten haus rechr gewisser erhält gründen betreffende nachm\n", + "ober beyden gewisser befinden sothane halb besteht rechr gewe lung\n", + "bekannt rechr deutsche geschichte schmeichelt sollen vorhandene melden erhält schau\n", + "thig ausgenommen bracht hätte schwere kreis daselbst verlangen rechr ober\n", + "wisse derley befind schaden bereit gläubiger verstrichen leute allgemein gewisser\n", + "rechr oktober hauptstadt pfandrecht leute rden ichen beyden bemerkte macher\n", + "preise rich haus wien verkauf nachm bereit mauer käuflich platze\n", + "nich nähern schlesien nachfrage vergnügen verstärkung kauft karten find ichen\n", + "besteht kohl bestimmte lebe mehr lauten kanonen herrn zimmern thal\n", + "mehr davon schlesien deut legt berichte majors anverwandte händen platze\n", + "beyden nachm bekannt wahr nürnberg wann zweyter oktober liquidiren viele\n", + "beyden wurde gerathen mach geschehen rischen reichs zelt lung gemeldet\n", + "partheyen zweyter pfandrecht stande leute geständig wisse verkauf schaden viele\n", + "gewe eingetroffen besteht geschehen macht königreich fein gewisser mach haus\n", + "wisse rechtssache rothen straffe mach freyherr schaden brücke gewe haust\n", + "wasser grundsätzen handbuch gemeldet preise befindlich steuer endlich rechr lebe\n", + "grund königreich gemeldet rechr 
wohnhaft zeitungen wienerzeitung feinden gestandenen obrigkeit\n", + "gewe viele zeitungen zahlen liquidiren vertheidigung nachm statten genaueste mehr\n", + "beyden gewisser pier langte rechr bringen neubauer gestorben pest kriege\n", + "erlaubniß allgemein begebenheiten tags platze königreich wasser bereits graden gedeckt\n", + "bringen rechtssache erlaubniß verstrichen bestimmte geschehen konkurs rechr wage wisse\n", + "besteht geschehen rechr schicksal öffentlichen haust namen gemacht nothwendig london\n", + "verkaufe begebenheiten seite nähern pfandrecht leitung christian königreich regiments vorzuladen\n", + "nutzen namen band jakob befehle mittels verkauf verbinden lebe ober\n", + "rechr asse bekannt nähern gemeldet verkaufe nürnberg leute gewisser lebe\n", + "verkaufe beyden berech besteht allerhand bereits lehr kaum lauten nürnberg\n", + "pest melden eingetroffen bekannt berlin feinden verstrichen verkaufe wahrscheinlich stande\n", + "barb bringen haust gewisser liquidiren schau rothen anker geltend geschehen\n", + "ober kriegs gemeldet seite gewisser nachmittags rechr ungeachtet straffe regina\n", + "bekannt dienste erinnert enthalten leute bringen niederlage christian papiere stern\n", + "verbinden frage bald allgemein viele begebenheiten anfang nürnberg stande rechr\n", + "stande nung bekannt leicht bedient rechr verkaufe langte gewe obrigkeit\n", + "besteht befinden mühle gleiche preise gewisser allgemein rechr bereit wich\n", + "beyden mmer gewisser konnten nich melden verstrichen allgemein nachm endlich\n", + "königreich bereits grund könne verlangte rechr ferner nähern lassen leute\n", + "anfang gewe erobert ebenfalls rechr wisse viele haus befindlich gelegenen\n", + "hätte rechr viele find hader mithin nürnberg verstorbenen doktor verkaufe\n", + "rechtssache rechr herrn herausgabe königreich vollen daselbst nothwendig beyden geschehen\n", + "schritt endlich herrn melde landesregierung befehle dadurch lauten hauptstadt bringen\n", + "rechr 
königreich bringen bürgerschaft oktober verkaufe erhält jahren welch stroh\n", + "besteht langte befindlich verkauf erlaubniß festung gewisser zurück abge grund\n", + "bewegungen wage grund platze vollmacht tage merkantil dern freyen erleichtern\n", + "rechr begebenheiten beyden baaden find wasser lung viele anleitung schau\n", + "ausgenommen person rechr resia zurück gänzlich erlaubt eingetroffen gewe statten\n", + "schwere besteht viele hätte geschehen rechr dieß könne pest gottes\n", + "pest beyden liegendes gehet rechtssache gedachter leute rechr wien gemacht\n", + "grund rechr königreich ausgenommen beyden sothane verkauf kirche nimmt bekannt\n", + "oktober linz haus hauptstadt verkauf find gege eingetroffen stand bewegungen\n" + ] + } + ], + "source": [ + "for t in model_output['topics']:\n", + " print(\" \".join(t))" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "39749ac2-f03e-4007-96f4-962c3dbce2e4", + "metadata": {}, + "outputs": [], + "source": [ + "from octis.evaluation_metrics.coherence_metrics import Coherence" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "e16cfefb-6e35-4e8e-bffa-dc75ac4d0b78", + "metadata": {}, + "outputs": [], + "source": [ + "c_v = Coherence(texts=dataset.get_corpus(), topk=10, measure='c_v')" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "f96cd3ae-2e63-4415-95f2-09e7ecf5a491", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Coherence: 0.24269082272061301\n" + ] + } + ], + "source": [ + "c_v_score1 = c_v.score(model_output)\n", + "print(\"Coherence: \"+str(c_v_score1))" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "2664a16f-17f1-49c1-b884-1dfb57ad5d19", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Coherence: 0.2322927611424697\n" + ] + } + ], + "source": [ + "c_v_score2 = c_v.score(model_output)\n", + "print(\"Coherence: 
\"+str(c_v_score2))" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "e4a55846-65f4-4a23-9192-64dcdc5e2088", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Coherence: 0.25430712709212944\n" + ] + } + ], + "source": [ + "c_v_score3 = c_v.score(model_output)\n", + "print(\"Coherence: \"+str(c_v_score3))" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "0784a0ad-939a-4f81-89ba-2d60f261d339", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.2430969036517374" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "(c_v_score1 + c_v_score2 + c_v_score3)/3" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "84e6785d-0f39-4f24-840b-4adaf390b359", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 54, + "id": "ea12613e-84a1-405b-9e36-3b8192bb9e2f", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0.00892981328927209\n", + "0.005752487635194249\n", + "0.013216860969465203\n", + "0.006727193655771849\n", + "0.013936653763250066\n", + "0.009115385087321232\n", + "0.012557738666291252\n", + "0.013758111866533848\n", + "0.00805919258169647\n", + "0.012569742992897433\n", + "0.006951230721679613\n", + "0.006120088422368138\n", + "0.005240785352245796\n", + "0.018566502926676918\n", + "0.006817132426694355\n", + "0.013163342719120574\n", + "0.007764790879213965\n", + "0.006431077827665201\n", + "0.00528377585935812\n", + "0.013046113878454259\n", + "0.005100105596317744\n", + "0.016067656288437683\n", + "0.012385502040523327\n", + "0.014854079636636595\n", + "0.014636284356045486\n", + "0.00641009885177839\n", + "0.014581746918840642\n", + "0.012688601130985317\n", + "0.01782811822175431\n", + "0.01709644317032735\n", + "0.0054470091205421674\n", + "0.006953811360111723\n", + 
"0.013934429242144242\n", + "0.009330621112046614\n", + "0.012584305598337684\n", + "0.007505920441375554\n", + "0.015205508842207264\n", + "0.005320571877913652\n", + "0.005451252684711359\n", + "0.005202965103118378\n", + "0.005938796580060631\n", + "0.011943943957095407\n", + "0.00514229963193619\n", + "0.007768431705554113\n", + "0.010843483438326812\n", + "0.005888860664856077\n", + "0.00767057689343882\n", + "0.005469522022562204\n", + "0.0066302273675308\n", + "0.013525858358622878\n", + "0.0068566577324780855\n", + "0.006910914033822761\n", + "0.012369832473927023\n", + "0.006880960416511569\n", + "0.007287157000973821\n", + "0.005224719083656563\n", + "0.005133935413180502\n", + "0.005220418668814872\n", + "0.0104119454901894\n", + "0.006978537085997455\n", + "0.005054730849849072\n", + "0.013813768080692807\n", + "0.011676042336410631\n", + "0.018316130308102977\n", + "0.013738562824330265\n", + "0.006765332405792515\n", + "0.014279150634009872\n", + "0.012483622073167307\n", + "0.012903620910322282\n", + "0.0074068728343018\n", + "0.006650707405917575\n", + "0.014741938189814794\n", + "0.004934789926425034\n", + "0.01761044112771201\n", + "0.006685835963537905\n", + "0.018982859545507314\n", + "0.014406598972990835\n", + "0.0071355210712888036\n", + "0.010536963477205097\n", + "0.0063256092306706434\n", + "0.012557359143771643\n", + "0.005407262549227092\n", + "0.011592576917306594\n", + "0.015215490551871116\n", + "0.006571163045545251\n", + "0.009033264530868343\n", + "0.005555467889358524\n", + "0.013273532700902023\n", + "0.0072792586770502885\n", + "0.0050834710802597225\n", + "0.00794934848769128\n", + "0.013096709809968807\n", + "0.01527988217182549\n", + "0.018238299983365038\n", + "0.009112778566834843\n", + "0.007862051470388024\n", + "0.01378072461718979\n", + "0.014571650513659226\n", + "0.017400475798826094\n" + ] + } + ], + "source": [ + "for list in model_output['topic-document-matrix']:\n", + " print(((sum(list))/652))" + ] + }, + { + 
"cell_type": "code", + "execution_count": 55, + "id": "b75fdc65-9760-4f41-81f6-1d1b098b3773", + "metadata": {}, + "outputs": [], + "source": [ + "with open('output_wz1.csv', 'w') as csvfile:\n", + " csvwriter = csv.writer(csvfile)\n", + " for t in model_output['topics']:\n", + " csvwriter.writerow(t)" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "id": "a492a18f-6a3b-4214-9258-1454aadb2a21", + "metadata": {}, + "outputs": [], + "source": [ + "with open('output_wz1_sc.csv', 'w') as csvfile:\n", + " csvwriter = csv.writer(csvfile)\n", + " for list in model_output['topic-document-matrix']:\n", + " csvwriter.writerow(str((sum(list))/652))" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "id": "5b6e77f3-3cdd-4281-bd1a-7b2a83baa66c", + "metadata": {}, + "outputs": [], + "source": [ + "a = pd.read_csv(\"output_wz1.csv\", sep='\\t', encoding='cp1252', header=None)\n", + "b = pd.read_csv(\"output_wz1_sc.csv\", sep='\\t', header =None, encoding='cp1252')" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "id": "9e00fe47-5acd-4384-afc2-51249f890082", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df = a.merge(b, left_index=True, right_index=True, how='left')" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "id": "a6e984bf-4809-4e0e-96c2-88e017c598db", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df = topic_df.rename(columns={\"0_x\": \"topic\", \"0_y\": \"percentage\"})" + ] + }, + { + "cell_type": "code", + "execution_count": 60, + "id": "76db06b0-e447-4689-b59e-1e98179ce83b", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df['topic'] = topic_df['topic'].str.replace(\",\", \" \")" + ] + }, + { + "cell_type": "code", + "execution_count": 61, + "id": "5778dc4c-5a89-4c7d-8de7-ac2145f78110", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df['percentage'] = topic_df['percentage'].str.replace(\",\", \"\")" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "id": 
"24fd92b6-3cfe-44dc-9533-fa6d54f3e58a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
topicpercentage
0erhebung widrigen beschreibung achen gedenket ...0.00892981328927209
1mann schmeichelt stehen anna einzuschreiten sc...0.005752487635194249
2schwei beste ankunft begehren leich fich cach ...0.013216860969465203
3antheil weite schmeichelt jahr begeben möchte ...0.006727193655771849
4meere begeben goldenen kunst anna tagl beste g...0.013936653763250066
.........
94zeitung wenig jahr diensten traf pfandrechts o...0.009112778566834843
95oberlieutenant hell eilte stellte könnten verl...0.007862051470388024
96barometerstand klara goldenen ches vergleich w...0.01378072461718979
97diensten öder liebhaber erhebung angeordnet ge...0.014571650513659226
98folge melde weiteren vorstädte einrichtung wir...0.017400475798826094
\n", + "

99 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " topic percentage\n", + "0 erhebung widrigen beschreibung achen gedenket ... 0.00892981328927209\n", + "1 mann schmeichelt stehen anna einzuschreiten sc... 0.005752487635194249\n", + "2 schwei beste ankunft begehren leich fich cach ... 0.013216860969465203\n", + "3 antheil weite schmeichelt jahr begeben möchte ... 0.006727193655771849\n", + "4 meere begeben goldenen kunst anna tagl beste g... 0.013936653763250066\n", + ".. ... ...\n", + "94 zeitung wenig jahr diensten traf pfandrechts o... 0.009112778566834843\n", + "95 oberlieutenant hell eilte stellte könnten verl... 0.007862051470388024\n", + "96 barometerstand klara goldenen ches vergleich w... 0.01378072461718979\n", + "97 diensten öder liebhaber erhebung angeordnet ge... 0.014571650513659226\n", + "98 folge melde weiteren vorstädte einrichtung wir... 0.017400475798826094\n", + "\n", + "[99 rows x 2 columns]" + ] + }, + "execution_count": 62, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "topic_df" + ] + }, + { + "cell_type": "code", + "execution_count": 64, + "id": "c0edbacb-e6cc-4069-b9dc-8e1d164b47d5", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df_wz = topic_df.assign(newspaper=\"wz\")" + ] + }, + { + "cell_type": "code", + "execution_count": 65, + "id": "f77be8a8-dee3-477e-b304-b5b77b6f0f15", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
topicpercentagenewspaper
0erhebung widrigen beschreibung achen gedenket ...0.00892981328927209wz
1mann schmeichelt stehen anna einzuschreiten sc...0.005752487635194249wz
2schwei beste ankunft begehren leich fich cach ...0.013216860969465203wz
3antheil weite schmeichelt jahr begeben möchte ...0.006727193655771849wz
4meere begeben goldenen kunst anna tagl beste g...0.013936653763250066wz
............
94zeitung wenig jahr diensten traf pfandrechts o...0.009112778566834843wz
95oberlieutenant hell eilte stellte könnten verl...0.007862051470388024wz
96barometerstand klara goldenen ches vergleich w...0.01378072461718979wz
97diensten öder liebhaber erhebung angeordnet ge...0.014571650513659226wz
98folge melde weiteren vorstädte einrichtung wir...0.017400475798826094wz
\n", + "

99 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " topic percentage \\\n", + "0 erhebung widrigen beschreibung achen gedenket ... 0.00892981328927209 \n", + "1 mann schmeichelt stehen anna einzuschreiten sc... 0.005752487635194249 \n", + "2 schwei beste ankunft begehren leich fich cach ... 0.013216860969465203 \n", + "3 antheil weite schmeichelt jahr begeben möchte ... 0.006727193655771849 \n", + "4 meere begeben goldenen kunst anna tagl beste g... 0.013936653763250066 \n", + ".. ... ... \n", + "94 zeitung wenig jahr diensten traf pfandrechts o... 0.009112778566834843 \n", + "95 oberlieutenant hell eilte stellte könnten verl... 0.007862051470388024 \n", + "96 barometerstand klara goldenen ches vergleich w... 0.01378072461718979 \n", + "97 diensten öder liebhaber erhebung angeordnet ge... 0.014571650513659226 \n", + "98 folge melde weiteren vorstädte einrichtung wir... 0.017400475798826094 \n", + "\n", + " newspaper \n", + "0 wz \n", + "1 wz \n", + "2 wz \n", + "3 wz \n", + "4 wz \n", + ".. ... \n", + "94 wz \n", + "95 wz \n", + "96 wz \n", + "97 wz \n", + "98 wz \n", + "\n", + "[99 rows x 3 columns]" + ] + }, + "execution_count": 65, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "topic_df_wz" + ] + }, + { + "cell_type": "code", + "execution_count": 66, + "id": "0e1a2eef-f395-4720-a29d-abb6ade56960", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df_wz.to_csv('topics1_wz.csv', sep=',', index=True, header=True, encoding='cp1252')" + ] + }, + { + "cell_type": "code", + "execution_count": 67, + "id": "677a6801-1948-48fd-9f73-3613e96f4a4d", + "metadata": {}, + "outputs": [], + "source": [ + "topic_df_wz.to_excel(\"topics_wz1.xlsx\", index=True, header=True)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a4890687-7641-4fe2-8574-09b126228b61", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "ff87084c-3562-430f-acaa-8d7a6d2c4e92", + "metadata": {}, + "source": [ + "

Create an Excel file combining the WZ and SZ topics for manual interpretation

" + ] + }, + { + "cell_type": "code", + "execution_count": 76, + "id": "2d86efcb-706a-4075-a4f8-fda8acf4300b", + "metadata": {}, + "outputs": [], + "source": [ + "a = pd.read_csv(\"topics_sz.csv\", sep=',', encoding='cp1252')\n", + "b = pd.read_csv(\"topics1_wz.csv\", sep=',', encoding='cp1252')" + ] + }, + { + "cell_type": "code", + "execution_count": 77, + "id": "822f15e2-b9e0-47b2-8d18-ad6dd6cfa238", + "metadata": {}, + "outputs": [], + "source": [ + "df_topics = b.append(a)" + ] + }, + { + "cell_type": "code", + "execution_count": 78, + "id": "8e5746af-c973-49ad-84eb-64de8dd85506", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0topicpercentagenewspaper
00erhebung widrigen beschreibung achen gedenket ...0.008930wz
11mann schmeichelt stehen anna einzuschreiten sc...0.005752wz
22schwei beste ankunft begehren leich fich cach ...0.013217wz
33antheil weite schmeichelt jahr begeben möchte ...0.006727wz
44meere begeben goldenen kunst anna tagl beste g...0.013937wz
...............
6262pariser tafeln hungarn wahr jesu unaufhörlich ...0.015926sz
6363geschlachtet ungerechter schwer einmahl franzö...0.014824sz
6464werke redliche wenige größ seide begraben heil...0.013928sz
6565blattes natürlichen summe vergrößerten besoldu...0.015981sz
6666körpern stifte erlauben ansehen brin neun munt...0.014102sz
\n", + "

166 rows × 4 columns

\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 topic percentage \\\n", + "0 0 erhebung widrigen beschreibung achen gedenket ... 0.008930 \n", + "1 1 mann schmeichelt stehen anna einzuschreiten sc... 0.005752 \n", + "2 2 schwei beste ankunft begehren leich fich cach ... 0.013217 \n", + "3 3 antheil weite schmeichelt jahr begeben möchte ... 0.006727 \n", + "4 4 meere begeben goldenen kunst anna tagl beste g... 0.013937 \n", + ".. ... ... ... \n", + "62 62 pariser tafeln hungarn wahr jesu unaufhörlich ... 0.015926 \n", + "63 63 geschlachtet ungerechter schwer einmahl franzö... 0.014824 \n", + "64 64 werke redliche wenige größ seide begraben heil... 0.013928 \n", + "65 65 blattes natürlichen summe vergrößerten besoldu... 0.015981 \n", + "66 66 körpern stifte erlauben ansehen brin neun munt... 0.014102 \n", + "\n", + " newspaper \n", + "0 wz \n", + "1 wz \n", + "2 wz \n", + "3 wz \n", + "4 wz \n", + ".. ... \n", + "62 sz \n", + "63 sz \n", + "64 sz \n", + "65 sz \n", + "66 sz \n", + "\n", + "[166 rows x 4 columns]" + ] + }, + "execution_count": 78, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_topics" + ] + }, + { + "cell_type": "code", + "execution_count": 79, + "id": "9d6112cb-2d76-4682-84b2-d18aa00fbe55", + "metadata": {}, + "outputs": [], + "source": [ + "df_topics = df_topics.iloc[: , 1:]" + ] + }, + { + "cell_type": "code", + "execution_count": 80, + "id": "4e7aeb4a-e3b1-4137-ae3d-62e9099099c4", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
topicpercentagenewspaper
0erhebung widrigen beschreibung achen gedenket ...0.008930wz
1mann schmeichelt stehen anna einzuschreiten sc...0.005752wz
2schwei beste ankunft begehren leich fich cach ...0.013217wz
3antheil weite schmeichelt jahr begeben möchte ...0.006727wz
4meere begeben goldenen kunst anna tagl beste g...0.013937wz
............
62pariser tafeln hungarn wahr jesu unaufhörlich ...0.015926sz
63geschlachtet ungerechter schwer einmahl franzö...0.014824sz
64werke redliche wenige größ seide begraben heil...0.013928sz
65blattes natürlichen summe vergrößerten besoldu...0.015981sz
66körpern stifte erlauben ansehen brin neun munt...0.014102sz
\n", + "

166 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " topic percentage newspaper\n", + "0 erhebung widrigen beschreibung achen gedenket ... 0.008930 wz\n", + "1 mann schmeichelt stehen anna einzuschreiten sc... 0.005752 wz\n", + "2 schwei beste ankunft begehren leich fich cach ... 0.013217 wz\n", + "3 antheil weite schmeichelt jahr begeben möchte ... 0.006727 wz\n", + "4 meere begeben goldenen kunst anna tagl beste g... 0.013937 wz\n", + ".. ... ... ...\n", + "62 pariser tafeln hungarn wahr jesu unaufhörlich ... 0.015926 sz\n", + "63 geschlachtet ungerechter schwer einmahl franzö... 0.014824 sz\n", + "64 werke redliche wenige größ seide begraben heil... 0.013928 sz\n", + "65 blattes natürlichen summe vergrößerten besoldu... 0.015981 sz\n", + "66 körpern stifte erlauben ansehen brin neun munt... 0.014102 sz\n", + "\n", + "[166 rows x 3 columns]" + ] + }, + "execution_count": 80, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_topics" + ] + }, + { + "cell_type": "code", + "execution_count": 81, + "id": "78d99632-b788-4a3e-b030-dc1ce4d3f093", + "metadata": {}, + "outputs": [], + "source": [ + "df_topics.index.name=\"num_topic\"" + ] + }, + { + "cell_type": "code", + "execution_count": 82, + "id": "39fa34a6-a56c-47db-971e-2eb3334bf2ed", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
topicpercentagenewspaper
num_topic
0erhebung widrigen beschreibung achen gedenket ...0.008930wz
1mann schmeichelt stehen anna einzuschreiten sc...0.005752wz
2schwei beste ankunft begehren leich fich cach ...0.013217wz
3antheil weite schmeichelt jahr begeben möchte ...0.006727wz
4meere begeben goldenen kunst anna tagl beste g...0.013937wz
............
62pariser tafeln hungarn wahr jesu unaufhörlich ...0.015926sz
63geschlachtet ungerechter schwer einmahl franzö...0.014824sz
64werke redliche wenige größ seide begraben heil...0.013928sz
65blattes natürlichen summe vergrößerten besoldu...0.015981sz
66körpern stifte erlauben ansehen brin neun munt...0.014102sz
\n", + "

166 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " topic percentage \\\n", + "num_topic \n", + "0 erhebung widrigen beschreibung achen gedenket ... 0.008930 \n", + "1 mann schmeichelt stehen anna einzuschreiten sc... 0.005752 \n", + "2 schwei beste ankunft begehren leich fich cach ... 0.013217 \n", + "3 antheil weite schmeichelt jahr begeben möchte ... 0.006727 \n", + "4 meere begeben goldenen kunst anna tagl beste g... 0.013937 \n", + "... ... ... \n", + "62 pariser tafeln hungarn wahr jesu unaufhörlich ... 0.015926 \n", + "63 geschlachtet ungerechter schwer einmahl franzö... 0.014824 \n", + "64 werke redliche wenige größ seide begraben heil... 0.013928 \n", + "65 blattes natürlichen summe vergrößerten besoldu... 0.015981 \n", + "66 körpern stifte erlauben ansehen brin neun munt... 0.014102 \n", + "\n", + " newspaper \n", + "num_topic \n", + "0 wz \n", + "1 wz \n", + "2 wz \n", + "3 wz \n", + "4 wz \n", + "... ... \n", + "62 sz \n", + "63 sz \n", + "64 sz \n", + "65 sz \n", + "66 sz \n", + "\n", + "[166 rows x 3 columns]" + ] + }, + "execution_count": 82, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_topics" + ] + }, + { + "cell_type": "code", + "execution_count": 83, + "id": "ff003ef7-403e-49e1-a299-d82e1c76576d", + "metadata": {}, + "outputs": [], + "source": [ + "df_topics.to_excel(\"topics_gesamt.xlsx\", index=True, header=True)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +}