From 93ee286fc555bfa1be53df20d593328105be4f48 Mon Sep 17 00:00:00 2001 From: Benjamin van der Burgh Date: Wed, 20 Feb 2019 11:57:20 +0100 Subject: [PATCH] Added experiments and results for Dutch on 110kDBRD dataset --- experiments/dutch/README.md | 26 + experiments/dutch/fastText/README.md | 52 + experiments/dutch/fastText/predict.sh | 7 + experiments/dutch/fastText/prepare.py | 36 + experiments/dutch/fastText/requirements.txt | 1 + experiments/dutch/fastText/train.sh | 17 + experiments/dutch/flair/README.md | 7 + .../dutch/flair/flair_experiment.ipynb | 2315 +++++++++++++++++ experiments/dutch/flair/requirements.txt | 1 + experiments/dutch/svm/README.md | 7 + experiments/dutch/svm/requirements.txt | 1 + experiments/dutch/svm/svm_experiment.ipynb | 163 ++ .../dutch/ulmfit_no_pretrain/README.md | 9 + .../dutch/ulmfit_no_pretrain/requirements.txt | 1 + .../ulmfit_no_pretrain.ipynb | 1062 ++++++++ .../dutch/ulmfit_pretrained_wiki/README.md | 13 + .../ulmfit_pretrained_wiki/requirements.txt | 1 + .../ulmfit_pretrain_exeperiment.ipynb | 1404 ++++++++++ 18 files changed, 5123 insertions(+) create mode 100644 experiments/dutch/README.md create mode 100644 experiments/dutch/fastText/README.md create mode 100755 experiments/dutch/fastText/predict.sh create mode 100755 experiments/dutch/fastText/prepare.py create mode 100644 experiments/dutch/fastText/requirements.txt create mode 100755 experiments/dutch/fastText/train.sh create mode 100644 experiments/dutch/flair/README.md create mode 100644 experiments/dutch/flair/flair_experiment.ipynb create mode 100644 experiments/dutch/flair/requirements.txt create mode 100644 experiments/dutch/svm/README.md create mode 100644 experiments/dutch/svm/requirements.txt create mode 100644 experiments/dutch/svm/svm_experiment.ipynb create mode 100644 experiments/dutch/ulmfit_no_pretrain/README.md create mode 100644 experiments/dutch/ulmfit_no_pretrain/requirements.txt create mode 100644 
experiments/dutch/ulmfit_no_pretrain/ulmfit_no_pretrain.ipynb create mode 100644 experiments/dutch/ulmfit_pretrained_wiki/README.md create mode 100644 experiments/dutch/ulmfit_pretrained_wiki/requirements.txt create mode 100644 experiments/dutch/ulmfit_pretrained_wiki/ulmfit_pretrain_exeperiment.ipynb diff --git a/experiments/dutch/README.md b/experiments/dutch/README.md new file mode 100644 index 0000000..985028f --- /dev/null +++ b/experiments/dutch/README.md @@ -0,0 +1,26 @@ +# ULMFiT experiments for Dutch + +```` +Author: Benjamin van der Burgh +Email: b.van.der.burgh@liacs.leidenuniv.nl +Affiliation: LIACS, Universiteit Leiden, Leiden, The Netherlands +```` + + +## Description + +This folder contains experiments that were done with ULMFiT and compared against various baselines. The dataset that was used is [110kDBRD](https://github.com/benjaminvdb/110kDBRD). + +## LM weights + +LM trained on Dutch Wikipedia: http://bit.ly/2trOhzq + +## Results + +```` +ULMFiT pre-trained: 93.84% +ULMFiT no pre-train: 92.55% +SVM: 89.16% +Flair with fastText: 88.48% +fastText: 80.90% +```` \ No newline at end of file diff --git a/experiments/dutch/fastText/README.md b/experiments/dutch/fastText/README.md new file mode 100644 index 0000000..dc7c0b2 --- /dev/null +++ b/experiments/dutch/fastText/README.md @@ -0,0 +1,52 @@ +# fastText classifier baseline + +## Description + +This folder contains scripts that were used to obtain a baseline for the sentiment polarity classification task. + +## fastText + +### Install + +We'll be using the command-line tool, which supports using pre-trained word embeddings. 
Instructions for downloading and building fastText can be found here: https://github.com/facebookresearch/fastText + +### Word embeddings + +Pre-trained word embeddings for Dutch can be downloaded from: https://dl.fbaipublicfiles.com/fasttext/vectors-wiki/wiki.nl.zip + +Extract them to the current directory: `unzip wiki.nl.zip` + +## Dataset + +### Download + +The experiments were run on the 110kDBRD dataset, which can be downloaded from here: https://github.com/benjaminvdb/110kDBRD + +### Convert + +The 110kDBRD dataset is in a different format and needs to be converted first. Run `prepare.py` to convert the *extracted* dataset and save it to the current directory. + +```` +python ./prepare.py /path/to/110kDBRD +```` + +## Modelling + +### Train + +```` +./train.sh train.txt ./wiki.nl.vec +Read 26M words +Number of words: 665350 +Number of labels: 2 +Progress: 100.0% words/sec/thread: 337040 lr: 0.000000 loss: 0.074446 ETA: 0h 0m +```` + +### Test + +```` +./predict.sh test.txt +N 10972 +P@1 0.809 +R@1 0.809 +```` \ No newline at end of file diff --git a/experiments/dutch/fastText/predict.sh b/experiments/dutch/fastText/predict.sh new file mode 100755 index 0000000..7181400 --- /dev/null +++ b/experiments/dutch/fastText/predict.sh @@ -0,0 +1,7 @@ +#!/usr/bin/env sh + +TEST_FILE=$1 + +./fasttext test \ + model.bin \ + $TEST_FILE 1 diff --git a/experiments/dutch/fastText/prepare.py b/experiments/dutch/fastText/prepare.py new file mode 100755 index 0000000..ba04975 --- /dev/null +++ b/experiments/dutch/fastText/prepare.py @@ -0,0 +1,36 @@ +#!/usr/bin/env python2 + +import os +import sys +import codecs +import re +import tarfile + +from sklearn.datasets import load_files + + +def convert(input_dir, output_file): + """ + Convert 110kDBRD dataset into fastText compatible format. 
+ """ + regex = re.compile(r'\s+') + dataset = load_files(input_dir, encoding='utf-8') + with codecs.open(output_file, 'w', encoding='utf-8') as f: + buff = u'\n'.join([u'__label__{} {}'.format(target, regex.sub(' ', text).strip()) for target, text in zip(dataset.target, dataset.data)]) + f.write(buff) + + +def main(): + """ + Expects the root of 110kDBRD as input argument. Converts and saves to ./train.txt and ./test.txt + """ + base_dir = sys.argv[1] + train_dir = os.path.join(base_dir, 'train') + test_dir = os.path.join(base_dir, 'test') + + convert(train_dir, 'train.txt') + convert(test_dir, 'test.txt') + + +if __name__ == '__main__': + main() \ No newline at end of file diff --git a/experiments/dutch/fastText/requirements.txt b/experiments/dutch/fastText/requirements.txt new file mode 100644 index 0000000..1afcc19 --- /dev/null +++ b/experiments/dutch/fastText/requirements.txt @@ -0,0 +1 @@ +scikit-learn==0.20.1 \ No newline at end of file diff --git a/experiments/dutch/fastText/train.sh b/experiments/dutch/fastText/train.sh new file mode 100755 index 0000000..12876a4 --- /dev/null +++ b/experiments/dutch/fastText/train.sh @@ -0,0 +1,17 @@ +#!/usr/bin/env sh + +TRAIN_FILE=$1 +PRETRAINED=$2 + +./fasttext supervised \ + -input $TRAIN_FILE \ + -output model \ + -epoch 25 \ + -wordNgrams 4 \ + -dim 300 \ + -loss hs \ + -thread 7 \ + -minCount 1 \ + -lr 1.0 \ + -verbose 2 \ + -pretrainedVectors $PRETRAINED diff --git a/experiments/dutch/flair/README.md b/experiments/dutch/flair/README.md new file mode 100644 index 0000000..a1ece1e --- /dev/null +++ b/experiments/dutch/flair/README.md @@ -0,0 +1,7 @@ +# Flair classifier baseline + +## Description + +[Flair](https://github.com/zalandoresearch/flair) with [fastText](https://github.com/facebookresearch/fastText) Dutch word embeddings was used to obtain a baseline for the sentiment polarity classification task. + +The folder simply includes a notebook that shows the experiment and its results. 
\ No newline at end of file diff --git a/experiments/dutch/flair/flair_experiment.ipynb b/experiments/dutch/flair/flair_experiment.ipynb new file mode 100644 index 0000000..1b975c9 --- /dev/null +++ b/experiments/dutch/flair/flair_experiment.ipynb @@ -0,0 +1,2315 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "from flair.data import TaggedCorpus\n", + "from flair.data_fetcher import NLPTaskDataFetcher, NLPTask\n", + "from flair.embeddings import WordEmbeddings, FlairEmbeddings, DocumentLSTMEmbeddings\n", + "from flair.models import TextClassifier\n", + "from flair.trainers import ModelTrainer" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 15:56:14,003 Reading data from /local/burghbvander/flair_experiments\n", + "2019-02-18 15:56:14,005 Train: /local/burghbvander/flair_experiments/train_smaller.txt\n", + "2019-02-18 15:56:14,006 Dev: /local/burghbvander/flair_experiments/dev.txt\n", + "2019-02-18 15:56:14,006 Test: /local/burghbvander/flair_experiments/test.txt\n" + ] + } + ], + "source": [ + "from flair.data_fetcher import NLPTaskDataFetcher\n", + "from pathlib import Path\n", + "\n", + "# use your own data path\n", + "data_folder = Path('/local/burghbvander/flair_experiments/')\n", + "\n", + "# load corpus containing training, test and dev data\n", + "corpus: TaggedCorpus = NLPTaskDataFetcher.load_classification_corpus(data_folder,\n", + " test_file='test.txt',\n", + " dev_file='dev.txt',\n", + " train_file='train_smaller.txt')" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "# 2. create the label dictionary\n", + "label_dict = corpus.make_label_dictionary()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "# 3. 
make a list of word embeddings\n", + "word_embeddings = [WordEmbeddings('nl')\n", + "# FlairEmbeddings('dutch-forward'),\n", + "# FlairEmbeddings('dutch-backward')\n", + "\n", + " # comment in flair embeddings for state-of-the-art results \n", + "# FlairEmbeddings('news-forward'),\n", + "# FlairEmbeddings('news-backward'),\n", + " ]" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "# 4. init document embedding by passing list of word embeddings\n", + "document_embeddings: DocumentLSTMEmbeddings = DocumentLSTMEmbeddings(word_embeddings,\n", + " hidden_size=512,\n", + " reproject_words=True,\n", + " reproject_words_dimension=256,\n", + " )" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "# 5. create the text classifier\n", + "classifier = TextClassifier(document_embeddings, label_dictionary=label_dict, multi_label=False)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "# 6. 
initialize the text classifier trainer\n", + "trainer = ModelTrainer(classifier, corpus)" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": { + "collapsed": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 15:58:08,278 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 15:58:08,279 Evaluation method: MICRO_F1_SCORE\n", + "2019-02-18 15:58:08,281 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 15:58:09,203 epoch 1 - iter 0/526 - loss 0.02127613\n", + "2019-02-18 15:58:52,760 epoch 1 - iter 52/526 - loss 0.01889031\n", + "2019-02-18 15:59:46,718 epoch 1 - iter 104/526 - loss 0.01824219\n", + "2019-02-18 16:00:30,909 epoch 1 - iter 156/526 - loss 0.01770823\n", + "2019-02-18 16:01:19,406 epoch 1 - iter 208/526 - loss 0.01749309\n", + "2019-02-18 16:02:04,412 epoch 1 - iter 260/526 - loss 0.01735454\n", + "2019-02-18 16:02:56,693 epoch 1 - iter 312/526 - loss 0.01706644\n", + "2019-02-18 16:03:36,529 epoch 1 - iter 364/526 - loss 0.01698531\n", + "2019-02-18 16:04:21,896 epoch 1 - iter 416/526 - loss 0.01690337\n", + "2019-02-18 16:05:04,667 epoch 1 - iter 468/526 - loss 0.01680622\n", + "2019-02-18 16:05:54,632 epoch 1 - iter 520/526 - loss 0.01671503\n", + "2019-02-18 16:05:58,057 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:05:58,059 EPOCH 1 done: loss 0.0167 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:06:38,014 DEV : loss 0.01553357 - f-score 0.7349 - acc 0.7349\n", + "2019-02-18 16:07:05,520 TEST : loss 0.02054467 - f-score 0.6267 - acc 0.6267\n", + "2019-02-18 16:07:14,260 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:07:15,178 epoch 2 - iter 0/526 - loss 0.01717842\n", + "2019-02-18 16:07:52,789 
epoch 2 - iter 52/526 - loss 0.01595207\n", + "2019-02-18 16:08:38,517 epoch 2 - iter 104/526 - loss 0.01552524\n", + "2019-02-18 16:09:18,423 epoch 2 - iter 156/526 - loss 0.01546827\n", + "2019-02-18 16:09:55,639 epoch 2 - iter 208/526 - loss 0.01533624\n", + "2019-02-18 16:10:36,471 epoch 2 - iter 260/526 - loss 0.01531059\n", + "2019-02-18 16:11:20,440 epoch 2 - iter 312/526 - loss 0.01536111\n", + "2019-02-18 16:12:01,423 epoch 2 - iter 364/526 - loss 0.01536426\n", + "2019-02-18 16:12:45,635 epoch 2 - iter 416/526 - loss 0.01534227\n", + "2019-02-18 16:13:34,458 epoch 2 - iter 468/526 - loss 0.01524534\n", + "2019-02-18 16:14:15,592 epoch 2 - iter 520/526 - loss 0.01515822\n", + "2019-02-18 16:14:19,540 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:14:19,542 EPOCH 2 done: loss 0.0152 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:14:56,222 DEV : loss 0.01485776 - f-score 0.7599 - acc 0.7599\n", + "2019-02-18 16:15:22,438 TEST : loss 0.01995775 - f-score 0.6534 - acc 0.6534\n", + "2019-02-18 16:15:33,203 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:15:34,269 epoch 3 - iter 0/526 - loss 0.01352574\n", + "2019-02-18 16:16:15,668 epoch 3 - iter 52/526 - loss 0.01487503\n", + "2019-02-18 16:16:56,937 epoch 3 - iter 104/526 - loss 0.01488308\n", + "2019-02-18 16:17:43,956 epoch 3 - iter 156/526 - loss 0.01489741\n", + "2019-02-18 16:18:23,976 epoch 3 - iter 208/526 - loss 0.01483106\n", + "2019-02-18 16:19:06,144 epoch 3 - iter 260/526 - loss 0.01486248\n", + "2019-02-18 16:19:48,716 epoch 3 - iter 312/526 - loss 0.01475698\n", + "2019-02-18 16:20:28,351 epoch 3 - iter 364/526 - loss 0.01464827\n", + "2019-02-18 16:21:11,465 epoch 3 - iter 416/526 - loss 0.01454867\n", + "2019-02-18 16:21:57,595 epoch 3 - iter 468/526 - loss 0.01450732\n", + "2019-02-18 16:22:33,474 epoch 3 - iter 520/526 - loss 0.01456542\n", + 
"2019-02-18 16:22:38,061 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:22:38,062 EPOCH 3 done: loss 0.0146 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:23:12,592 DEV : loss 0.01434629 - f-score 0.7714 - acc 0.7714\n", + "2019-02-18 16:23:38,321 TEST : loss 0.02016712 - f-score 0.6539 - acc 0.6539\n", + "2019-02-18 16:23:49,399 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:23:50,874 epoch 4 - iter 0/526 - loss 0.01323878\n", + "2019-02-18 16:24:32,184 epoch 4 - iter 52/526 - loss 0.01348973\n", + "2019-02-18 16:25:11,676 epoch 4 - iter 104/526 - loss 0.01362511\n", + "2019-02-18 16:25:53,569 epoch 4 - iter 156/526 - loss 0.01371228\n", + "2019-02-18 16:26:38,569 epoch 4 - iter 208/526 - loss 0.01398436\n", + "2019-02-18 16:27:16,954 epoch 4 - iter 260/526 - loss 0.01406107\n", + "2019-02-18 16:27:56,288 epoch 4 - iter 312/526 - loss 0.01402520\n", + "2019-02-18 16:28:35,774 epoch 4 - iter 364/526 - loss 0.01396586\n", + "2019-02-18 16:29:17,182 epoch 4 - iter 416/526 - loss 0.01398844\n", + "2019-02-18 16:29:58,304 epoch 4 - iter 468/526 - loss 0.01397442\n", + "2019-02-18 16:30:36,673 epoch 4 - iter 520/526 - loss 0.01393643\n", + "2019-02-18 16:30:40,184 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:30:40,185 EPOCH 4 done: loss 0.0139 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:31:15,968 DEV : loss 0.01392026 - f-score 0.7859 - acc 0.7859\n", + "2019-02-18 16:31:40,487 TEST : loss 0.01973633 - f-score 0.6740 - acc 0.6740\n", + "2019-02-18 16:31:51,508 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:31:52,725 epoch 5 - iter 0/526 - loss 0.01598181\n", + "2019-02-18 16:32:36,083 epoch 5 - iter 52/526 - loss 0.01334639\n", + "2019-02-18 16:33:17,879 epoch 5 - iter 
104/526 - loss 0.01330042\n", + "2019-02-18 16:34:03,064 epoch 5 - iter 156/526 - loss 0.01334889\n", + "2019-02-18 16:34:46,187 epoch 5 - iter 208/526 - loss 0.01332951\n", + "2019-02-18 16:35:23,356 epoch 5 - iter 260/526 - loss 0.01349746\n", + "2019-02-18 16:36:07,931 epoch 5 - iter 312/526 - loss 0.01352572\n", + "2019-02-18 16:36:48,456 epoch 5 - iter 364/526 - loss 0.01362373\n", + "2019-02-18 16:37:28,204 epoch 5 - iter 416/526 - loss 0.01364770\n", + "2019-02-18 16:38:09,262 epoch 5 - iter 468/526 - loss 0.01367406\n", + "2019-02-18 16:38:54,083 epoch 5 - iter 520/526 - loss 0.01353081\n", + "2019-02-18 16:38:58,947 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:38:58,948 EPOCH 5 done: loss 0.0135 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:39:43,079 DEV : loss 0.01338645 - f-score 0.7994 - acc 0.7994\n", + "2019-02-18 16:40:10,662 TEST : loss 0.01683049 - f-score 0.7447 - acc 0.7447\n", + "2019-02-18 16:40:21,709 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:40:22,566 epoch 6 - iter 0/526 - loss 0.01515922\n", + "2019-02-18 16:41:00,739 epoch 6 - iter 52/526 - loss 0.01319935\n", + "2019-02-18 16:41:42,353 epoch 6 - iter 104/526 - loss 0.01306053\n", + "2019-02-18 16:42:22,524 epoch 6 - iter 156/526 - loss 0.01334328\n", + "2019-02-18 16:43:02,983 epoch 6 - iter 208/526 - loss 0.01322553\n", + "2019-02-18 16:43:46,347 epoch 6 - iter 260/526 - loss 0.01316519\n", + "2019-02-18 16:44:26,672 epoch 6 - iter 312/526 - loss 0.01344200\n", + "2019-02-18 16:45:05,290 epoch 6 - iter 364/526 - loss 0.01345868\n", + "2019-02-18 16:45:40,805 epoch 6 - iter 416/526 - loss 0.01348272\n", + "2019-02-18 16:46:23,473 epoch 6 - iter 468/526 - loss 0.01350070\n", + "2019-02-18 16:47:01,389 epoch 6 - iter 520/526 - loss 0.01347896\n", + "2019-02-18 16:47:04,699 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:47:04,700 EPOCH 6 done: loss 0.0135 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:47:41,476 DEV : loss 0.01267112 - f-score 0.8054 - acc 0.8054\n", + "2019-02-18 16:48:08,294 TEST : loss 0.01666281 - f-score 0.7519 - acc 0.7519\n", + "2019-02-18 16:48:19,065 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:48:19,876 epoch 7 - iter 0/526 - loss 0.01306688\n", + "2019-02-18 16:49:00,903 epoch 7 - iter 52/526 - loss 0.01367513\n", + "2019-02-18 16:49:43,185 epoch 7 - iter 104/526 - loss 0.01332517\n", + "2019-02-18 16:50:21,140 epoch 7 - iter 156/526 - loss 0.01319720\n", + "2019-02-18 16:51:00,818 epoch 7 - iter 208/526 - loss 0.01318900\n", + "2019-02-18 16:51:40,858 epoch 7 - iter 260/526 - loss 0.01314650\n", + "2019-02-18 16:52:24,149 epoch 7 - iter 312/526 - loss 0.01310183\n", + "2019-02-18 16:53:01,585 epoch 7 - iter 364/526 - loss 0.01307307\n", + "2019-02-18 16:53:41,933 epoch 7 - iter 416/526 - loss 0.01312719\n", + "2019-02-18 16:54:19,028 epoch 7 - iter 468/526 - loss 0.01315661\n", + "2019-02-18 16:55:02,962 epoch 7 - iter 520/526 - loss 0.01312956\n", + "2019-02-18 16:55:07,229 ----------------------------------------------------------------------------------------------------\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 16:55:07,230 EPOCH 7 done: loss 0.0131 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 16:55:43,209 DEV : loss 0.01436462 - f-score 0.7654 - acc 0.7654\n", + "2019-02-18 16:56:07,425 TEST : loss 0.01884936 - f-score 0.6807 - acc 0.6807\n", + "2019-02-18 16:56:18,415 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 16:56:19,243 epoch 8 - iter 0/526 - loss 0.01391503\n", + "2019-02-18 16:57:02,814 epoch 8 - iter 52/526 - loss 
0.01269610\n", + "2019-02-18 16:57:38,786 epoch 8 - iter 104/526 - loss 0.01287505\n", + "2019-02-18 16:58:16,825 epoch 8 - iter 156/526 - loss 0.01289498\n", + "2019-02-18 16:58:55,526 epoch 8 - iter 208/526 - loss 0.01269878\n", + "2019-02-18 16:59:38,772 epoch 8 - iter 260/526 - loss 0.01278463\n", + "2019-02-18 17:00:19,956 epoch 8 - iter 312/526 - loss 0.01280592\n", + "2019-02-18 17:01:06,535 epoch 8 - iter 364/526 - loss 0.01280442\n", + "2019-02-18 17:01:46,057 epoch 8 - iter 416/526 - loss 0.01269708\n", + "2019-02-18 17:02:26,427 epoch 8 - iter 468/526 - loss 0.01273897\n", + "2019-02-18 17:03:06,014 epoch 8 - iter 520/526 - loss 0.01280426\n", + "2019-02-18 17:03:09,355 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:03:09,356 EPOCH 8 done: loss 0.0128 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:03:50,934 DEV : loss 0.01279273 - f-score 0.7994 - acc 0.7994\n", + "2019-02-18 17:04:18,228 TEST : loss 0.01753456 - f-score 0.7165 - acc 0.7165\n", + "2019-02-18 17:04:29,146 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:04:30,116 epoch 9 - iter 0/526 - loss 0.00904663\n", + "2019-02-18 17:05:14,147 epoch 9 - iter 52/526 - loss 0.01267557\n", + "2019-02-18 17:05:55,132 epoch 9 - iter 104/526 - loss 0.01258353\n", + "2019-02-18 17:06:45,871 epoch 9 - iter 156/526 - loss 0.01273380\n", + "2019-02-18 17:07:39,826 epoch 9 - iter 208/526 - loss 0.01289245\n", + "2019-02-18 17:08:37,689 epoch 9 - iter 260/526 - loss 0.01284212\n", + "2019-02-18 17:09:31,316 epoch 9 - iter 312/526 - loss 0.01287030\n", + "2019-02-18 17:10:22,492 epoch 9 - iter 364/526 - loss 0.01284674\n", + "2019-02-18 17:11:14,441 epoch 9 - iter 416/526 - loss 0.01277994\n", + "2019-02-18 17:12:09,854 epoch 9 - iter 468/526 - loss 0.01269307\n", + "2019-02-18 17:12:53,877 epoch 9 - iter 520/526 - loss 0.01269265\n", + "2019-02-18 17:12:59,603 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:12:59,606 EPOCH 9 done: loss 0.0127 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:13:37,247 DEV : loss 0.01260460 - f-score 0.8069 - acc 0.8069\n", + "2019-02-18 17:14:03,124 TEST : loss 0.01784888 - f-score 0.7027 - acc 0.7027\n", + "2019-02-18 17:14:13,869 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:14:14,678 epoch 10 - iter 0/526 - loss 0.01197039\n", + "2019-02-18 17:14:55,993 epoch 10 - iter 52/526 - loss 0.01214427\n", + "2019-02-18 17:15:38,582 epoch 10 - iter 104/526 - loss 0.01237999\n", + "2019-02-18 17:16:22,818 epoch 10 - iter 156/526 - loss 0.01240889\n", + "2019-02-18 17:17:04,752 epoch 10 - iter 208/526 - loss 0.01233547\n", + "2019-02-18 17:17:42,918 epoch 10 - iter 260/526 - loss 0.01240603\n", + "2019-02-18 17:18:19,815 epoch 10 - iter 312/526 - loss 0.01244341\n", + "2019-02-18 17:19:04,682 epoch 10 - iter 364/526 - loss 0.01248983\n", + "2019-02-18 17:19:45,431 epoch 10 - iter 416/526 - loss 0.01255515\n", + "2019-02-18 17:20:27,207 epoch 10 - iter 468/526 - loss 0.01253496\n", + "2019-02-18 17:21:05,278 epoch 10 - iter 520/526 - loss 0.01255321\n", + "2019-02-18 17:21:08,906 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:21:08,908 EPOCH 10 done: loss 0.0125 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:21:44,505 DEV : loss 0.01219011 - f-score 0.8179 - acc 0.8179\n", + "2019-02-18 17:22:10,338 TEST : loss 0.01602328 - f-score 0.7653 - acc 0.7653\n", + "2019-02-18 17:22:21,375 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:22:22,291 epoch 11 - iter 0/526 - loss 0.01013956\n", + "2019-02-18 17:23:04,136 epoch 11 - iter 52/526 - loss 0.01213045\n", + "2019-02-18 17:23:43,762 epoch 11 - iter 104/526 - 
loss 0.01261378\n", + "2019-02-18 17:24:25,567 epoch 11 - iter 156/526 - loss 0.01224389\n", + "2019-02-18 17:25:17,665 epoch 11 - iter 208/526 - loss 0.01231242\n", + "2019-02-18 17:26:05,704 epoch 11 - iter 260/526 - loss 0.01216261\n", + "2019-02-18 17:26:44,226 epoch 11 - iter 312/526 - loss 0.01229325\n", + "2019-02-18 17:27:25,686 epoch 11 - iter 364/526 - loss 0.01229002\n", + "2019-02-18 17:28:03,442 epoch 11 - iter 416/526 - loss 0.01234051\n", + "2019-02-18 17:28:41,458 epoch 11 - iter 468/526 - loss 0.01241809\n", + "2019-02-18 17:29:28,208 epoch 11 - iter 520/526 - loss 0.01242832\n", + "2019-02-18 17:29:32,230 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:29:32,231 EPOCH 11 done: loss 0.0124 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:30:07,672 DEV : loss 0.01209316 - f-score 0.8169 - acc 0.8169\n", + "2019-02-18 17:30:31,773 TEST : loss 0.01652627 - f-score 0.7519 - acc 0.7519\n", + "2019-02-18 17:30:42,529 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:30:43,322 epoch 12 - iter 0/526 - loss 0.01227321\n", + "2019-02-18 17:31:33,231 epoch 12 - iter 52/526 - loss 0.01224642\n", + "2019-02-18 17:32:16,506 epoch 12 - iter 104/526 - loss 0.01227952\n", + "2019-02-18 17:32:57,046 epoch 12 - iter 156/526 - loss 0.01233341\n", + "2019-02-18 17:33:39,580 epoch 12 - iter 208/526 - loss 0.01250964\n", + "2019-02-18 17:34:21,545 epoch 12 - iter 260/526 - loss 0.01254298\n", + "2019-02-18 17:35:01,734 epoch 12 - iter 312/526 - loss 0.01239779\n", + "2019-02-18 17:35:39,321 epoch 12 - iter 364/526 - loss 0.01242299\n", + "2019-02-18 17:36:17,535 epoch 12 - iter 416/526 - loss 0.01238217\n", + "2019-02-18 17:37:02,206 epoch 12 - iter 468/526 - loss 0.01238705\n", + "2019-02-18 17:37:42,575 epoch 12 - iter 520/526 - loss 0.01237962\n", + "2019-02-18 17:37:46,411 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:37:46,412 EPOCH 12 done: loss 0.0124 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:38:23,579 DEV : loss 0.01263722 - f-score 0.8114 - acc 0.8114\n", + "2019-02-18 17:38:48,537 TEST : loss 0.01537714 - f-score 0.7677 - acc 0.7677\n", + "2019-02-18 17:38:59,483 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:39:00,389 epoch 13 - iter 0/526 - loss 0.00931402\n", + "2019-02-18 17:39:38,625 epoch 13 - iter 52/526 - loss 0.01237009\n", + "2019-02-18 17:40:23,446 epoch 13 - iter 104/526 - loss 0.01227296\n", + "2019-02-18 17:41:11,095 epoch 13 - iter 156/526 - loss 0.01209146\n", + "2019-02-18 17:41:52,252 epoch 13 - iter 208/526 - loss 0.01210759\n", + "2019-02-18 17:42:34,558 epoch 13 - iter 260/526 - loss 0.01217075\n", + "2019-02-18 17:43:13,732 epoch 13 - iter 312/526 - loss 0.01206028\n", + "2019-02-18 17:43:52,797 epoch 13 - iter 364/526 - loss 0.01200963\n", + "2019-02-18 17:44:33,837 epoch 13 - iter 416/526 - loss 0.01200332\n", + "2019-02-18 17:45:15,198 epoch 13 - iter 468/526 - loss 0.01202327\n", + "2019-02-18 17:45:54,386 epoch 13 - iter 520/526 - loss 0.01199283\n", + "2019-02-18 17:45:58,060 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:45:58,061 EPOCH 13 done: loss 0.0120 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:46:33,516 DEV : loss 0.01170990 - f-score 0.8329 - acc 0.8329\n", + "2019-02-18 17:46:59,277 TEST : loss 0.01515957 - f-score 0.7787 - acc 0.7787\n", + "2019-02-18 17:47:10,206 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:47:11,119 epoch 14 - iter 0/526 - loss 0.00990110\n", + "2019-02-18 17:47:47,469 epoch 14 - iter 52/526 - loss 0.01083351\n", + "2019-02-18 17:48:24,868 epoch 14 - iter 104/526 
- loss 0.01140991\n", + "2019-02-18 17:49:02,643 epoch 14 - iter 156/526 - loss 0.01159181\n", + "2019-02-18 17:49:44,398 epoch 14 - iter 208/526 - loss 0.01157900\n", + "2019-02-18 17:50:24,427 epoch 14 - iter 260/526 - loss 0.01169203\n", + "2019-02-18 17:51:06,430 epoch 14 - iter 312/526 - loss 0.01174273\n", + "2019-02-18 17:51:53,758 epoch 14 - iter 364/526 - loss 0.01178766\n", + "2019-02-18 17:52:36,084 epoch 14 - iter 416/526 - loss 0.01170609\n", + "2019-02-18 17:53:20,535 epoch 14 - iter 468/526 - loss 0.01166916\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 17:54:02,337 epoch 14 - iter 520/526 - loss 0.01174037\n", + "2019-02-18 17:54:05,345 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:54:05,346 EPOCH 14 done: loss 0.0117 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 17:54:41,545 DEV : loss 0.01152237 - f-score 0.8289 - acc 0.8289\n", + "2019-02-18 17:55:06,820 TEST : loss 0.01493260 - f-score 0.7796 - acc 0.7796\n", + "2019-02-18 17:55:17,794 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 17:55:18,906 epoch 15 - iter 0/526 - loss 0.00745257\n", + "2019-02-18 17:55:56,971 epoch 15 - iter 52/526 - loss 0.01075182\n", + "2019-02-18 17:56:36,160 epoch 15 - iter 104/526 - loss 0.01123895\n", + "2019-02-18 17:57:14,979 epoch 15 - iter 156/526 - loss 0.01111512\n", + "2019-02-18 17:57:55,841 epoch 15 - iter 208/526 - loss 0.01109633\n", + "2019-02-18 17:58:35,062 epoch 15 - iter 260/526 - loss 0.01120362\n", + "2019-02-18 17:59:16,808 epoch 15 - iter 312/526 - loss 0.01121806\n", + "2019-02-18 17:59:56,804 epoch 15 - iter 364/526 - loss 0.01125122\n", + "2019-02-18 18:00:40,281 epoch 15 - iter 416/526 - loss 0.01134365\n", + "2019-02-18 18:01:18,374 epoch 15 - iter 468/526 - loss 0.01133036\n", + "2019-02-18 18:01:59,215 epoch 15 - iter 520/526 - loss 0.01130990\n", + 
"2019-02-18 18:02:05,436 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:02:05,439 EPOCH 15 done: loss 0.0113 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:02:42,647 DEV : loss 0.01007134 - f-score 0.8579 - acc 0.8579\n", + "2019-02-18 18:03:08,268 TEST : loss 0.01374990 - f-score 0.7997 - acc 0.7997\n", + "2019-02-18 18:03:19,140 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:03:19,973 epoch 16 - iter 0/526 - loss 0.00623085\n", + "2019-02-18 18:04:05,629 epoch 16 - iter 52/526 - loss 0.01067232\n", + "2019-02-18 18:04:43,731 epoch 16 - iter 104/526 - loss 0.01074571\n", + "2019-02-18 18:05:27,007 epoch 16 - iter 156/526 - loss 0.01048908\n", + "2019-02-18 18:06:07,405 epoch 16 - iter 208/526 - loss 0.01026548\n", + "2019-02-18 18:06:52,095 epoch 16 - iter 260/526 - loss 0.01016827\n", + "2019-02-18 18:07:35,782 epoch 16 - iter 312/526 - loss 0.01007975\n", + "2019-02-18 18:08:12,756 epoch 16 - iter 364/526 - loss 0.00996693\n", + "2019-02-18 18:08:49,916 epoch 16 - iter 416/526 - loss 0.00979732\n", + "2019-02-18 18:09:36,652 epoch 16 - iter 468/526 - loss 0.00971618\n", + "2019-02-18 18:10:18,519 epoch 16 - iter 520/526 - loss 0.00975455\n", + "2019-02-18 18:10:21,727 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:10:21,728 EPOCH 16 done: loss 0.0098 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:10:58,722 DEV : loss 0.00873072 - f-score 0.8744 - acc 0.8744\n", + "2019-02-18 18:11:24,481 TEST : loss 0.01232619 - f-score 0.8279 - acc 0.8279\n", + "2019-02-18 18:11:35,296 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:11:36,044 epoch 17 - iter 0/526 - loss 0.00967250\n", + "2019-02-18 18:12:16,254 epoch 17 - iter 52/526 - loss 0.00922615\n", + "2019-02-18 18:12:52,615 
epoch 17 - iter 104/526 - loss 0.00890183\n", + "2019-02-18 18:13:28,146 epoch 17 - iter 156/526 - loss 0.00908327\n", + "2019-02-18 18:14:11,353 epoch 17 - iter 208/526 - loss 0.00905697\n", + "2019-02-18 18:14:47,186 epoch 17 - iter 260/526 - loss 0.00902008\n", + "2019-02-18 18:15:26,947 epoch 17 - iter 312/526 - loss 0.00901800\n", + "2019-02-18 18:16:06,199 epoch 17 - iter 364/526 - loss 0.00896919\n", + "2019-02-18 18:16:48,604 epoch 17 - iter 416/526 - loss 0.00890790\n", + "2019-02-18 18:17:37,089 epoch 17 - iter 468/526 - loss 0.00878037\n", + "2019-02-18 18:18:16,169 epoch 17 - iter 520/526 - loss 0.00872495\n", + "2019-02-18 18:18:19,962 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:18:19,963 EPOCH 17 done: loss 0.0087 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:18:55,554 DEV : loss 0.00906551 - f-score 0.8754 - acc 0.8754\n", + "2019-02-18 18:19:26,327 TEST : loss 0.01094206 - f-score 0.8504 - acc 0.8504\n", + "2019-02-18 18:19:37,212 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:19:38,143 epoch 18 - iter 0/526 - loss 0.00958856\n", + "2019-02-18 18:20:14,891 epoch 18 - iter 52/526 - loss 0.00781917\n", + "2019-02-18 18:20:56,802 epoch 18 - iter 104/526 - loss 0.00790162\n", + "2019-02-18 18:21:40,229 epoch 18 - iter 156/526 - loss 0.00821849\n", + "2019-02-18 18:22:19,944 epoch 18 - iter 208/526 - loss 0.00806862\n", + "2019-02-18 18:23:03,430 epoch 18 - iter 260/526 - loss 0.00805257\n", + "2019-02-18 18:23:48,261 epoch 18 - iter 312/526 - loss 0.00811873\n", + "2019-02-18 18:24:33,787 epoch 18 - iter 364/526 - loss 0.00806263\n", + "2019-02-18 18:25:14,974 epoch 18 - iter 416/526 - loss 0.00806289\n", + "2019-02-18 18:26:02,290 epoch 18 - iter 468/526 - loss 0.00808262\n", + "2019-02-18 18:26:54,268 epoch 18 - iter 520/526 - loss 0.00809047\n", + "2019-02-18 18:26:58,970 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:26:58,971 EPOCH 18 done: loss 0.0081 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:27:48,778 DEV : loss 0.00895122 - f-score 0.8739 - acc 0.8739\n", + "2019-02-18 18:28:23,176 TEST : loss 0.01393017 - f-score 0.8040 - acc 0.8040\n", + "2019-02-18 18:28:34,073 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:28:34,820 epoch 19 - iter 0/526 - loss 0.00693367\n", + "2019-02-18 18:29:15,601 epoch 19 - iter 52/526 - loss 0.00744070\n", + "2019-02-18 18:29:52,711 epoch 19 - iter 104/526 - loss 0.00731393\n", + "2019-02-18 18:30:33,862 epoch 19 - iter 156/526 - loss 0.00768933\n", + "2019-02-18 18:31:13,904 epoch 19 - iter 208/526 - loss 0.00773914\n", + "2019-02-18 18:31:55,854 epoch 19 - iter 260/526 - loss 0.00769556\n", + "2019-02-18 18:32:35,011 epoch 19 - iter 312/526 - loss 0.00765124\n", + "2019-02-18 18:33:14,134 epoch 19 - iter 364/526 - loss 0.00763169\n", + "2019-02-18 18:33:51,035 epoch 19 - iter 416/526 - loss 0.00766937\n", + "2019-02-18 18:34:36,084 epoch 19 - iter 468/526 - loss 0.00765516\n", + "2019-02-18 18:35:17,404 epoch 19 - iter 520/526 - loss 0.00762454\n", + "2019-02-18 18:35:20,882 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:35:20,883 EPOCH 19 done: loss 0.0076 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:35:58,586 DEV : loss 0.00849486 - f-score 0.8789 - acc 0.8789\n", + "2019-02-18 18:36:24,922 TEST : loss 0.01305993 - f-score 0.8150 - acc 0.8150\n", + "2019-02-18 18:36:35,853 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:36:36,586 epoch 20 - iter 0/526 - loss 0.00446512\n", + "2019-02-18 18:37:17,576 epoch 20 - iter 52/526 - loss 0.00742575\n", + "2019-02-18 18:37:58,266 epoch 20 - iter 104/526 
- loss 0.00741747\n", + "2019-02-18 18:38:36,298 epoch 20 - iter 156/526 - loss 0.00731348\n", + "2019-02-18 18:39:16,881 epoch 20 - iter 208/526 - loss 0.00731204\n", + "2019-02-18 18:39:55,945 epoch 20 - iter 260/526 - loss 0.00735582\n", + "2019-02-18 18:40:37,616 epoch 20 - iter 312/526 - loss 0.00744158\n", + "2019-02-18 18:41:17,279 epoch 20 - iter 364/526 - loss 0.00746509\n", + "2019-02-18 18:41:55,950 epoch 20 - iter 416/526 - loss 0.00742372\n", + "2019-02-18 18:42:35,469 epoch 20 - iter 468/526 - loss 0.00739152\n", + "2019-02-18 18:43:15,558 epoch 20 - iter 520/526 - loss 0.00736543\n", + "2019-02-18 18:43:19,182 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:43:19,183 EPOCH 20 done: loss 0.0074 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:43:57,603 DEV : loss 0.00742245 - f-score 0.9025 - acc 0.9025\n", + "2019-02-18 18:44:23,549 TEST : loss 0.01072053 - f-score 0.8556 - acc 0.8556\n", + "2019-02-18 18:44:34,496 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:44:35,761 epoch 21 - iter 0/526 - loss 0.00700021\n", + "2019-02-18 18:45:15,499 epoch 21 - iter 52/526 - loss 0.00702865\n", + "2019-02-18 18:45:57,283 epoch 21 - iter 104/526 - loss 0.00684636\n", + "2019-02-18 18:46:39,477 epoch 21 - iter 156/526 - loss 0.00704635\n", + "2019-02-18 18:47:20,830 epoch 21 - iter 208/526 - loss 0.00724219\n", + "2019-02-18 18:48:09,691 epoch 21 - iter 260/526 - loss 0.00723798\n", + "2019-02-18 18:48:47,405 epoch 21 - iter 312/526 - loss 0.00715051\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 18:49:29,728 epoch 21 - iter 364/526 - loss 0.00711797\n", + "2019-02-18 18:50:12,052 epoch 21 - iter 416/526 - loss 0.00712686\n", + "2019-02-18 18:50:53,060 epoch 21 - iter 468/526 - loss 0.00710849\n", + "2019-02-18 18:51:37,296 epoch 21 - iter 520/526 - loss 0.00702905\n", + 
"2019-02-18 18:51:40,922 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:51:40,923 EPOCH 21 done: loss 0.0070 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 18:52:18,269 DEV : loss 0.00902766 - f-score 0.8769 - acc 0.8769\n", + "2019-02-18 18:52:44,386 TEST : loss 0.01008986 - f-score 0.8662 - acc 0.8662\n", + "2019-02-18 18:52:55,257 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:52:56,432 epoch 22 - iter 0/526 - loss 0.01365851\n", + "2019-02-18 18:53:39,296 epoch 22 - iter 52/526 - loss 0.00670433\n", + "2019-02-18 18:54:16,343 epoch 22 - iter 104/526 - loss 0.00679970\n", + "2019-02-18 18:54:55,685 epoch 22 - iter 156/526 - loss 0.00674478\n", + "2019-02-18 18:55:33,845 epoch 22 - iter 208/526 - loss 0.00668477\n", + "2019-02-18 18:56:14,839 epoch 22 - iter 260/526 - loss 0.00674326\n", + "2019-02-18 18:56:53,103 epoch 22 - iter 312/526 - loss 0.00681602\n", + "2019-02-18 18:57:33,153 epoch 22 - iter 364/526 - loss 0.00691157\n", + "2019-02-18 18:58:10,846 epoch 22 - iter 416/526 - loss 0.00691438\n", + "2019-02-18 18:58:55,043 epoch 22 - iter 468/526 - loss 0.00688541\n", + "2019-02-18 18:59:32,914 epoch 22 - iter 520/526 - loss 0.00688444\n", + "2019-02-18 18:59:36,304 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 18:59:36,307 EPOCH 22 done: loss 0.0069 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:00:11,956 DEV : loss 0.01018114 - f-score 0.8749 - acc 0.8749\n", + "2019-02-18 19:00:36,143 TEST : loss 0.01700473 - f-score 0.7973 - acc 0.7973\n", + "2019-02-18 19:00:47,001 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:00:47,966 epoch 23 - iter 0/526 - loss 0.00208094\n", + "2019-02-18 19:01:35,538 epoch 23 - iter 52/526 - loss 0.00655314\n", + "2019-02-18 19:02:12,622 
epoch 23 - iter 104/526 - loss 0.00643935\n", + "2019-02-18 19:03:00,713 epoch 23 - iter 156/526 - loss 0.00649835\n", + "2019-02-18 19:03:40,690 epoch 23 - iter 208/526 - loss 0.00675218\n", + "2019-02-18 19:04:19,512 epoch 23 - iter 260/526 - loss 0.00665778\n", + "2019-02-18 19:04:59,313 epoch 23 - iter 312/526 - loss 0.00651823\n", + "2019-02-18 19:05:37,600 epoch 23 - iter 364/526 - loss 0.00648123\n", + "2019-02-18 19:06:19,002 epoch 23 - iter 416/526 - loss 0.00646906\n", + "2019-02-18 19:07:01,693 epoch 23 - iter 468/526 - loss 0.00656030\n", + "2019-02-18 19:07:45,891 epoch 23 - iter 520/526 - loss 0.00653499\n", + "2019-02-18 19:07:48,964 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:07:48,966 EPOCH 23 done: loss 0.0065 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:08:25,431 DEV : loss 0.00811643 - f-score 0.8944 - acc 0.8944\n", + "2019-02-18 19:08:50,269 TEST : loss 0.01300632 - f-score 0.8346 - acc 0.8346\n", + "2019-02-18 19:09:01,159 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:09:02,155 epoch 24 - iter 0/526 - loss 0.00370325\n", + "2019-02-18 19:09:39,881 epoch 24 - iter 52/526 - loss 0.00528836\n", + "2019-02-18 19:10:22,792 epoch 24 - iter 104/526 - loss 0.00564843\n", + "2019-02-18 19:11:01,662 epoch 24 - iter 156/526 - loss 0.00606675\n", + "2019-02-18 19:11:38,160 epoch 24 - iter 208/526 - loss 0.00607177\n", + "2019-02-18 19:12:16,088 epoch 24 - iter 260/526 - loss 0.00621683\n", + "2019-02-18 19:12:53,659 epoch 24 - iter 312/526 - loss 0.00632252\n", + "2019-02-18 19:13:30,327 epoch 24 - iter 364/526 - loss 0.00633934\n", + "2019-02-18 19:14:08,294 epoch 24 - iter 416/526 - loss 0.00634795\n", + "2019-02-18 19:14:50,062 epoch 24 - iter 468/526 - loss 0.00637791\n", + "2019-02-18 19:15:36,514 epoch 24 - iter 520/526 - loss 0.00631386\n", + "2019-02-18 19:15:40,854 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:15:40,855 EPOCH 24 done: loss 0.0063 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:16:29,853 DEV : loss 0.00701130 - f-score 0.9070 - acc 0.9070\n", + "2019-02-18 19:16:57,256 TEST : loss 0.01000786 - f-score 0.8662 - acc 0.8662\n", + "2019-02-18 19:17:08,232 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:17:09,031 epoch 25 - iter 0/526 - loss 0.00396606\n", + "2019-02-18 19:17:53,046 epoch 25 - iter 52/526 - loss 0.00648390\n", + "2019-02-18 19:18:34,367 epoch 25 - iter 104/526 - loss 0.00626455\n", + "2019-02-18 19:19:15,532 epoch 25 - iter 156/526 - loss 0.00635470\n", + "2019-02-18 19:19:54,340 epoch 25 - iter 208/526 - loss 0.00636875\n", + "2019-02-18 19:20:36,426 epoch 25 - iter 260/526 - loss 0.00619974\n", + "2019-02-18 19:21:16,967 epoch 25 - iter 312/526 - loss 0.00610287\n", + "2019-02-18 19:21:59,431 epoch 25 - iter 364/526 - loss 0.00604070\n", + "2019-02-18 19:22:36,775 epoch 25 - iter 416/526 - loss 0.00605358\n", + "2019-02-18 19:23:13,661 epoch 25 - iter 468/526 - loss 0.00611972\n", + "2019-02-18 19:23:53,071 epoch 25 - iter 520/526 - loss 0.00622856\n", + "2019-02-18 19:23:56,380 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:23:56,381 EPOCH 25 done: loss 0.0062 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:24:31,694 DEV : loss 0.00707518 - f-score 0.9040 - acc 0.9040\n", + "2019-02-18 19:24:56,882 TEST : loss 0.01061903 - f-score 0.8542 - acc 0.8542\n", + "2019-02-18 19:25:07,996 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:25:08,697 epoch 26 - iter 0/526 - loss 0.00863055\n", + "2019-02-18 19:25:47,732 epoch 26 - iter 52/526 - loss 0.00587896\n", + "2019-02-18 19:26:27,458 epoch 26 - iter 104/526 
- loss 0.00580321\n", + "2019-02-18 19:27:09,532 epoch 26 - iter 156/526 - loss 0.00573094\n", + "2019-02-18 19:27:46,472 epoch 26 - iter 208/526 - loss 0.00586916\n", + "2019-02-18 19:28:25,105 epoch 26 - iter 260/526 - loss 0.00591552\n", + "2019-02-18 19:29:08,893 epoch 26 - iter 312/526 - loss 0.00590248\n", + "2019-02-18 19:29:47,865 epoch 26 - iter 364/526 - loss 0.00594697\n", + "2019-02-18 19:30:26,496 epoch 26 - iter 416/526 - loss 0.00607133\n", + "2019-02-18 19:31:07,851 epoch 26 - iter 468/526 - loss 0.00602952\n", + "2019-02-18 19:31:49,167 epoch 26 - iter 520/526 - loss 0.00607515\n", + "2019-02-18 19:31:53,405 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:31:53,406 EPOCH 26 done: loss 0.0061 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:32:30,250 DEV : loss 0.00671551 - f-score 0.9185 - acc 0.9185\n", + "2019-02-18 19:32:56,248 TEST : loss 0.00952343 - f-score 0.8743 - acc 0.8743\n", + "2019-02-18 19:33:07,193 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:33:07,964 epoch 27 - iter 0/526 - loss 0.00227738\n", + "2019-02-18 19:33:46,347 epoch 27 - iter 52/526 - loss 0.00601368\n", + "2019-02-18 19:34:25,075 epoch 27 - iter 104/526 - loss 0.00591048\n", + "2019-02-18 19:35:07,728 epoch 27 - iter 156/526 - loss 0.00590332\n", + "2019-02-18 19:35:48,634 epoch 27 - iter 208/526 - loss 0.00604888\n", + "2019-02-18 19:36:25,451 epoch 27 - iter 260/526 - loss 0.00605107\n", + "2019-02-18 19:37:12,908 epoch 27 - iter 312/526 - loss 0.00611740\n", + "2019-02-18 19:37:56,356 epoch 27 - iter 364/526 - loss 0.00610380\n", + "2019-02-18 19:38:37,240 epoch 27 - iter 416/526 - loss 0.00601502\n", + "2019-02-18 19:39:15,762 epoch 27 - iter 468/526 - loss 0.00601412\n", + "2019-02-18 19:39:56,251 epoch 27 - iter 520/526 - loss 0.00600550\n", + "2019-02-18 19:40:00,093 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:40:00,094 EPOCH 27 done: loss 0.0060 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:40:35,771 DEV : loss 0.00741955 - f-score 0.9055 - acc 0.9055\n", + "2019-02-18 19:41:00,129 TEST : loss 0.01143624 - f-score 0.8537 - acc 0.8537\n", + "2019-02-18 19:41:10,947 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:41:11,765 epoch 28 - iter 0/526 - loss 0.00277614\n", + "2019-02-18 19:41:48,141 epoch 28 - iter 52/526 - loss 0.00652433\n", + "2019-02-18 19:42:29,356 epoch 28 - iter 104/526 - loss 0.00570894\n", + "2019-02-18 19:43:10,957 epoch 28 - iter 156/526 - loss 0.00581449\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 19:43:49,868 epoch 28 - iter 208/526 - loss 0.00561163\n", + "2019-02-18 19:44:29,693 epoch 28 - iter 260/526 - loss 0.00571488\n", + "2019-02-18 19:45:12,313 epoch 28 - iter 312/526 - loss 0.00580308\n", + "2019-02-18 19:45:51,397 epoch 28 - iter 364/526 - loss 0.00583960\n", + "2019-02-18 19:46:33,452 epoch 28 - iter 416/526 - loss 0.00583972\n", + "2019-02-18 19:47:12,304 epoch 28 - iter 468/526 - loss 0.00574856\n", + "2019-02-18 19:47:56,758 epoch 28 - iter 520/526 - loss 0.00571306\n", + "2019-02-18 19:47:59,826 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:47:59,829 EPOCH 28 done: loss 0.0057 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:48:35,872 DEV : loss 0.00659911 - f-score 0.9200 - acc 0.9200\n", + "2019-02-18 19:49:01,439 TEST : loss 0.00868921 - f-score 0.8805 - acc 0.8805\n", + "2019-02-18 19:49:12,256 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:49:13,427 epoch 29 - iter 0/526 - loss 0.00485749\n", + "2019-02-18 19:49:51,838 epoch 29 - iter 52/526 - 
loss 0.00564721\n", + "2019-02-18 19:50:30,378 epoch 29 - iter 104/526 - loss 0.00522518\n", + "2019-02-18 19:51:10,081 epoch 29 - iter 156/526 - loss 0.00568877\n", + "2019-02-18 19:51:49,802 epoch 29 - iter 208/526 - loss 0.00564869\n", + "2019-02-18 19:52:28,622 epoch 29 - iter 260/526 - loss 0.00563647\n", + "2019-02-18 19:53:11,167 epoch 29 - iter 312/526 - loss 0.00574610\n", + "2019-02-18 19:53:48,648 epoch 29 - iter 364/526 - loss 0.00568082\n", + "2019-02-18 19:54:27,901 epoch 29 - iter 416/526 - loss 0.00571574\n", + "2019-02-18 19:55:19,843 epoch 29 - iter 468/526 - loss 0.00569390\n", + "2019-02-18 19:55:59,771 epoch 29 - iter 520/526 - loss 0.00570530\n", + "2019-02-18 19:56:03,479 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:56:03,480 EPOCH 29 done: loss 0.0057 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 19:56:38,317 DEV : loss 0.00676128 - f-score 0.9140 - acc 0.9140\n", + "2019-02-18 19:57:04,002 TEST : loss 0.01025531 - f-score 0.8604 - acc 0.8604\n", + "2019-02-18 19:57:14,830 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 19:57:15,678 epoch 30 - iter 0/526 - loss 0.01091329\n", + "2019-02-18 19:58:01,712 epoch 30 - iter 52/526 - loss 0.00513044\n", + "2019-02-18 19:58:39,606 epoch 30 - iter 104/526 - loss 0.00500759\n", + "2019-02-18 19:59:27,895 epoch 30 - iter 156/526 - loss 0.00522309\n", + "2019-02-18 20:00:10,116 epoch 30 - iter 208/526 - loss 0.00523110\n", + "2019-02-18 20:00:50,092 epoch 30 - iter 260/526 - loss 0.00528235\n", + "2019-02-18 20:01:29,503 epoch 30 - iter 312/526 - loss 0.00546464\n", + "2019-02-18 20:02:10,113 epoch 30 - iter 364/526 - loss 0.00542460\n", + "2019-02-18 20:02:47,800 epoch 30 - iter 416/526 - loss 0.00543210\n", + "2019-02-18 20:03:28,931 epoch 30 - iter 468/526 - loss 0.00545644\n", + "2019-02-18 20:04:07,928 epoch 30 - iter 520/526 - loss 0.00548361\n", + 
"2019-02-18 20:04:11,827 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:04:11,828 EPOCH 30 done: loss 0.0055 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:04:46,557 DEV : loss 0.00742778 - f-score 0.9065 - acc 0.9065\n", + "2019-02-18 20:05:12,104 TEST : loss 0.01216540 - f-score 0.8461 - acc 0.8461\n", + "2019-02-18 20:05:23,320 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:05:24,008 epoch 31 - iter 0/526 - loss 0.00303670\n", + "2019-02-18 20:06:01,987 epoch 31 - iter 52/526 - loss 0.00505696\n", + "2019-02-18 20:06:38,512 epoch 31 - iter 104/526 - loss 0.00561687\n", + "2019-02-18 20:07:15,094 epoch 31 - iter 156/526 - loss 0.00549186\n", + "2019-02-18 20:07:53,514 epoch 31 - iter 208/526 - loss 0.00551414\n", + "2019-02-18 20:08:28,911 epoch 31 - iter 260/526 - loss 0.00549868\n", + "2019-02-18 20:09:08,379 epoch 31 - iter 312/526 - loss 0.00542240\n", + "2019-02-18 20:09:46,399 epoch 31 - iter 364/526 - loss 0.00545813\n", + "2019-02-18 20:10:28,703 epoch 31 - iter 416/526 - loss 0.00535614\n", + "2019-02-18 20:11:06,818 epoch 31 - iter 468/526 - loss 0.00537679\n", + "2019-02-18 20:11:46,134 epoch 31 - iter 520/526 - loss 0.00537339\n", + "2019-02-18 20:11:49,636 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:11:49,638 EPOCH 31 done: loss 0.0054 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:12:27,148 DEV : loss 0.00631380 - f-score 0.9250 - acc 0.9250\n", + "2019-02-18 20:12:53,549 TEST : loss 0.00956621 - f-score 0.8728 - acc 0.8728\n", + "2019-02-18 20:13:04,619 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:13:05,446 epoch 32 - iter 0/526 - loss 0.00277344\n", + "2019-02-18 20:13:48,262 epoch 32 - iter 52/526 - loss 0.00480584\n", + "2019-02-18 20:14:28,197 
epoch 32 - iter 104/526 - loss 0.00488942\n", + "2019-02-18 20:15:14,667 epoch 32 - iter 156/526 - loss 0.00496550\n", + "2019-02-18 20:15:54,196 epoch 32 - iter 208/526 - loss 0.00501320\n", + "2019-02-18 20:16:36,520 epoch 32 - iter 260/526 - loss 0.00514464\n", + "2019-02-18 20:17:19,796 epoch 32 - iter 312/526 - loss 0.00517199\n", + "2019-02-18 20:17:57,039 epoch 32 - iter 364/526 - loss 0.00514651\n", + "2019-02-18 20:18:33,410 epoch 32 - iter 416/526 - loss 0.00518220\n", + "2019-02-18 20:19:13,713 epoch 32 - iter 468/526 - loss 0.00522393\n", + "2019-02-18 20:19:55,510 epoch 32 - iter 520/526 - loss 0.00522841\n", + "2019-02-18 20:19:58,825 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:19:58,826 EPOCH 32 done: loss 0.0052 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:20:36,938 DEV : loss 0.00655561 - f-score 0.9165 - acc 0.9165\n", + "2019-02-18 20:21:02,225 TEST : loss 0.00874485 - f-score 0.8829 - acc 0.8829\n", + "2019-02-18 20:21:13,050 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:21:13,539 epoch 33 - iter 0/526 - loss 0.00345887\n", + "2019-02-18 20:21:53,421 epoch 33 - iter 52/526 - loss 0.00509555\n", + "2019-02-18 20:22:36,354 epoch 33 - iter 104/526 - loss 0.00513980\n", + "2019-02-18 20:23:17,252 epoch 33 - iter 156/526 - loss 0.00504405\n", + "2019-02-18 20:23:56,069 epoch 33 - iter 208/526 - loss 0.00506351\n", + "2019-02-18 20:24:40,131 epoch 33 - iter 260/526 - loss 0.00502177\n", + "2019-02-18 20:25:18,959 epoch 33 - iter 312/526 - loss 0.00496115\n", + "2019-02-18 20:25:56,059 epoch 33 - iter 364/526 - loss 0.00498400\n", + "2019-02-18 20:26:35,101 epoch 33 - iter 416/526 - loss 0.00503730\n", + "2019-02-18 20:27:10,064 epoch 33 - iter 468/526 - loss 0.00511903\n", + "2019-02-18 20:27:47,068 epoch 33 - iter 520/526 - loss 0.00506179\n", + "2019-02-18 20:27:50,715 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:27:50,716 EPOCH 33 done: loss 0.0051 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:28:26,073 DEV : loss 0.00671039 - f-score 0.9170 - acc 0.9170\n", + "2019-02-18 20:28:50,475 TEST : loss 0.00838385 - f-score 0.8958 - acc 0.8958\n", + "2019-02-18 20:29:01,331 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:29:02,799 epoch 34 - iter 0/526 - loss 0.00541468\n", + "2019-02-18 20:29:43,161 epoch 34 - iter 52/526 - loss 0.00535458\n", + "2019-02-18 20:30:24,871 epoch 34 - iter 104/526 - loss 0.00532681\n", + "2019-02-18 20:31:06,934 epoch 34 - iter 156/526 - loss 0.00517745\n", + "2019-02-18 20:31:46,657 epoch 34 - iter 208/526 - loss 0.00508750\n", + "2019-02-18 20:32:28,094 epoch 34 - iter 260/526 - loss 0.00506163\n", + "2019-02-18 20:33:07,706 epoch 34 - iter 312/526 - loss 0.00497305\n", + "2019-02-18 20:33:47,077 epoch 34 - iter 364/526 - loss 0.00493927\n", + "2019-02-18 20:34:28,584 epoch 34 - iter 416/526 - loss 0.00497704\n", + "2019-02-18 20:35:05,299 epoch 34 - iter 468/526 - loss 0.00500551\n", + "2019-02-18 20:35:41,709 epoch 34 - iter 520/526 - loss 0.00502267\n", + "2019-02-18 20:35:45,440 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:35:45,442 EPOCH 34 done: loss 0.0050 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:36:21,336 DEV : loss 0.00648914 - f-score 0.9215 - acc 0.9215\n", + "2019-02-18 20:36:45,359 TEST : loss 0.00947540 - f-score 0.8791 - acc 0.8791\n", + "2019-02-18 20:36:56,228 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:36:56,977 epoch 35 - iter 0/526 - loss 0.00254138\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 20:37:38,109 epoch 35 - iter 52/526 - 
loss 0.00486626\n", + "2019-02-18 20:38:21,944 epoch 35 - iter 104/526 - loss 0.00464931\n", + "2019-02-18 20:39:02,476 epoch 35 - iter 156/526 - loss 0.00467166\n", + "2019-02-18 20:39:39,040 epoch 35 - iter 208/526 - loss 0.00458144\n", + "2019-02-18 20:40:20,064 epoch 35 - iter 260/526 - loss 0.00466519\n", + "2019-02-18 20:40:59,534 epoch 35 - iter 312/526 - loss 0.00473275\n", + "2019-02-18 20:41:39,710 epoch 35 - iter 364/526 - loss 0.00480266\n", + "2019-02-18 20:42:17,946 epoch 35 - iter 416/526 - loss 0.00478740\n", + "2019-02-18 20:42:56,209 epoch 35 - iter 468/526 - loss 0.00478709\n", + "2019-02-18 20:43:38,886 epoch 35 - iter 520/526 - loss 0.00480185\n", + "2019-02-18 20:43:43,255 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:43:43,256 EPOCH 35 done: loss 0.0048 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:44:20,730 DEV : loss 0.00762835 - f-score 0.9055 - acc 0.9055\n", + "2019-02-18 20:44:46,691 TEST : loss 0.01265931 - f-score 0.8356 - acc 0.8356\n", + "2019-02-18 20:44:57,503 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:44:58,606 epoch 36 - iter 0/526 - loss 0.00431249\n", + "2019-02-18 20:45:40,307 epoch 36 - iter 52/526 - loss 0.00446975\n", + "2019-02-18 20:46:18,418 epoch 36 - iter 104/526 - loss 0.00485159\n", + "2019-02-18 20:46:54,950 epoch 36 - iter 156/526 - loss 0.00497521\n", + "2019-02-18 20:47:34,670 epoch 36 - iter 208/526 - loss 0.00486131\n", + "2019-02-18 20:48:13,052 epoch 36 - iter 260/526 - loss 0.00486605\n", + "2019-02-18 20:48:58,815 epoch 36 - iter 312/526 - loss 0.00487960\n", + "2019-02-18 20:49:40,770 epoch 36 - iter 364/526 - loss 0.00486963\n", + "2019-02-18 20:50:21,572 epoch 36 - iter 416/526 - loss 0.00491666\n", + "2019-02-18 20:51:11,050 epoch 36 - iter 468/526 - loss 0.00499552\n", + "2019-02-18 20:51:51,037 epoch 36 - iter 520/526 - loss 0.00495299\n", + 
"2019-02-18 20:51:54,586 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:51:54,587 EPOCH 36 done: loss 0.0050 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 20:52:31,926 DEV : loss 0.00754723 - f-score 0.9080 - acc 0.9080\n", + "2019-02-18 20:53:03,083 TEST : loss 0.00890553 - f-score 0.8815 - acc 0.8815\n", + "2019-02-18 20:53:03,085 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 20:53:03,598 epoch 37 - iter 0/526 - loss 0.00611407\n", + "2019-02-18 20:53:43,608 epoch 37 - iter 52/526 - loss 0.00438129\n", + "2019-02-18 20:54:26,584 epoch 37 - iter 104/526 - loss 0.00431170\n", + "2019-02-18 20:55:09,212 epoch 37 - iter 156/526 - loss 0.00440844\n", + "2019-02-18 20:55:51,370 epoch 37 - iter 208/526 - loss 0.00457593\n", + "2019-02-18 20:56:30,692 epoch 37 - iter 260/526 - loss 0.00450663\n", + "2019-02-18 20:57:09,351 epoch 37 - iter 312/526 - loss 0.00457339\n", + "2019-02-18 20:57:53,149 epoch 37 - iter 364/526 - loss 0.00459854\n", + "2019-02-18 20:58:36,870 epoch 37 - iter 416/526 - loss 0.00471017\n", + "2019-02-18 20:59:18,389 epoch 37 - iter 468/526 - loss 0.00472581\n", + "2019-02-18 21:00:00,388 epoch 37 - iter 520/526 - loss 0.00476817\n", + "2019-02-18 21:00:05,075 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:00:05,078 EPOCH 37 done: loss 0.0048 - lr 0.1000 - bad epochs 1\n", + "2019-02-18 21:00:43,382 DEV : loss 0.00671968 - f-score 0.9260 - acc 0.9260\n", + "2019-02-18 21:01:09,261 TEST : loss 0.00935920 - f-score 0.8881 - acc 0.8881\n", + "2019-02-18 21:01:20,202 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:01:20,954 epoch 38 - iter 0/526 - loss 0.00125326\n", + "2019-02-18 21:01:59,088 epoch 38 - iter 52/526 - loss 0.00482854\n", + "2019-02-18 21:02:42,063 
epoch 38 - iter 104/526 - loss 0.00473240\n", + "2019-02-18 21:03:26,364 epoch 38 - iter 156/526 - loss 0.00453341\n", + "2019-02-18 21:04:10,695 epoch 38 - iter 208/526 - loss 0.00471422\n", + "2019-02-18 21:04:54,233 epoch 38 - iter 260/526 - loss 0.00461908\n", + "2019-02-18 21:05:33,796 epoch 38 - iter 312/526 - loss 0.00458001\n", + "2019-02-18 21:06:17,393 epoch 38 - iter 364/526 - loss 0.00454397\n", + "2019-02-18 21:06:57,175 epoch 38 - iter 416/526 - loss 0.00460031\n", + "2019-02-18 21:07:37,441 epoch 38 - iter 468/526 - loss 0.00455714\n", + "2019-02-18 21:08:18,851 epoch 38 - iter 520/526 - loss 0.00466265\n", + "2019-02-18 21:08:22,178 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:08:22,179 EPOCH 38 done: loss 0.0047 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 21:08:59,680 DEV : loss 0.00658262 - f-score 0.9270 - acc 0.9270\n", + "2019-02-18 21:09:24,624 TEST : loss 0.00904336 - f-score 0.8834 - acc 0.8834\n", + "2019-02-18 21:09:35,606 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:09:36,748 epoch 39 - iter 0/526 - loss 0.00322293\n", + "2019-02-18 21:10:28,051 epoch 39 - iter 52/526 - loss 0.00477019\n", + "2019-02-18 21:11:15,955 epoch 39 - iter 104/526 - loss 0.00452314\n", + "2019-02-18 21:11:53,786 epoch 39 - iter 156/526 - loss 0.00428137\n", + "2019-02-18 21:12:30,426 epoch 39 - iter 208/526 - loss 0.00421742\n", + "2019-02-18 21:13:12,313 epoch 39 - iter 260/526 - loss 0.00418670\n", + "2019-02-18 21:13:54,716 epoch 39 - iter 312/526 - loss 0.00430061\n", + "2019-02-18 21:14:36,006 epoch 39 - iter 364/526 - loss 0.00436528\n", + "2019-02-18 21:15:14,603 epoch 39 - iter 416/526 - loss 0.00444931\n", + "2019-02-18 21:15:58,896 epoch 39 - iter 468/526 - loss 0.00445602\n", + "2019-02-18 21:16:42,371 epoch 39 - iter 520/526 - loss 0.00445684\n", + "2019-02-18 21:16:48,178 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:16:48,182 EPOCH 39 done: loss 0.0044 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 21:17:25,892 DEV : loss 0.00689131 - f-score 0.9300 - acc 0.9300\n", + "2019-02-18 21:17:51,974 TEST : loss 0.01112639 - f-score 0.8762 - acc 0.8762\n", + "2019-02-18 21:18:02,883 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:18:04,363 epoch 40 - iter 0/526 - loss 0.00486721\n", + "2019-02-18 21:18:51,887 epoch 40 - iter 52/526 - loss 0.00416534\n", + "2019-02-18 21:19:33,940 epoch 40 - iter 104/526 - loss 0.00454180\n", + "2019-02-18 21:20:21,834 epoch 40 - iter 156/526 - loss 0.00440060\n", + "2019-02-18 21:21:02,604 epoch 40 - iter 208/526 - loss 0.00441413\n", + "2019-02-18 21:21:43,965 epoch 40 - iter 260/526 - loss 0.00444192\n", + "2019-02-18 21:22:22,555 epoch 40 - iter 312/526 - loss 0.00451867\n", + "2019-02-18 21:23:02,929 epoch 40 - iter 364/526 - loss 0.00446207\n", + "2019-02-18 21:23:42,956 epoch 40 - iter 416/526 - loss 0.00453132\n", + "2019-02-18 21:24:24,143 epoch 40 - iter 468/526 - loss 0.00451663\n", + "2019-02-18 21:25:01,295 epoch 40 - iter 520/526 - loss 0.00452041\n", + "2019-02-18 21:25:05,192 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:25:05,193 EPOCH 40 done: loss 0.0045 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 21:25:40,220 DEV : loss 0.00639352 - f-score 0.9250 - acc 0.9250\n", + "2019-02-18 21:26:06,024 TEST : loss 0.00922748 - f-score 0.8815 - acc 0.8815\n", + "2019-02-18 21:26:06,027 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:26:06,835 epoch 41 - iter 0/526 - loss 0.00359781\n", + "2019-02-18 21:26:48,678 epoch 41 - iter 52/526 - loss 0.00427996\n", + "2019-02-18 21:27:28,459 epoch 41 - iter 104/526 
- loss 0.00410419\n", + "2019-02-18 21:28:16,896 epoch 41 - iter 156/526 - loss 0.00404274\n", + "2019-02-18 21:29:06,033 epoch 41 - iter 208/526 - loss 0.00410938\n", + "2019-02-18 21:29:50,899 epoch 41 - iter 260/526 - loss 0.00426882\n", + "2019-02-18 21:30:31,612 epoch 41 - iter 312/526 - loss 0.00430495\n", + "2019-02-18 21:31:13,656 epoch 41 - iter 364/526 - loss 0.00435696\n", + "2019-02-18 21:31:59,596 epoch 41 - iter 416/526 - loss 0.00437778\n", + "2019-02-18 21:32:36,157 epoch 41 - iter 468/526 - loss 0.00433847\n", + "2019-02-18 21:33:23,477 epoch 41 - iter 520/526 - loss 0.00439062\n", + "2019-02-18 21:33:27,803 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:33:27,804 EPOCH 41 done: loss 0.0044 - lr 0.1000 - bad epochs 1\n", + "2019-02-18 21:34:17,359 DEV : loss 0.00646965 - f-score 0.9235 - acc 0.9235\n", + "2019-02-18 21:34:51,500 TEST : loss 0.00933895 - f-score 0.8848 - acc 0.8848\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 21:35:02,397 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:35:03,260 epoch 42 - iter 0/526 - loss 0.00241166\n", + "2019-02-18 21:35:43,394 epoch 42 - iter 52/526 - loss 0.00424583\n", + "2019-02-18 21:36:27,727 epoch 42 - iter 104/526 - loss 0.00425751\n", + "2019-02-18 21:37:11,781 epoch 42 - iter 156/526 - loss 0.00417415\n", + "2019-02-18 21:37:51,732 epoch 42 - iter 208/526 - loss 0.00429902\n", + "2019-02-18 21:38:30,073 epoch 42 - iter 260/526 - loss 0.00425840\n", + "2019-02-18 21:39:09,222 epoch 42 - iter 312/526 - loss 0.00420073\n", + "2019-02-18 21:39:50,656 epoch 42 - iter 364/526 - loss 0.00419647\n", + "2019-02-18 21:40:31,932 epoch 42 - iter 416/526 - loss 0.00425195\n", + "2019-02-18 21:41:14,060 epoch 42 - iter 468/526 - loss 0.00428688\n", + "2019-02-18 21:41:57,861 epoch 42 - iter 520/526 - loss 0.00423423\n", + 
"2019-02-18 21:42:01,321 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:42:01,322 EPOCH 42 done: loss 0.0042 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 21:42:38,340 DEV : loss 0.00665304 - f-score 0.9210 - acc 0.9210\n", + "2019-02-18 21:43:03,507 TEST : loss 0.00993264 - f-score 0.8752 - acc 0.8752\n", + "2019-02-18 21:43:14,522 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:43:15,281 epoch 43 - iter 0/526 - loss 0.00307408\n", + "2019-02-18 21:43:55,531 epoch 43 - iter 52/526 - loss 0.00420892\n", + "2019-02-18 21:44:36,082 epoch 43 - iter 104/526 - loss 0.00416528\n", + "2019-02-18 21:45:17,762 epoch 43 - iter 156/526 - loss 0.00428778\n", + "2019-02-18 21:46:00,216 epoch 43 - iter 208/526 - loss 0.00425751\n", + "2019-02-18 21:46:37,180 epoch 43 - iter 260/526 - loss 0.00421303\n", + "2019-02-18 21:47:19,888 epoch 43 - iter 312/526 - loss 0.00413917\n", + "2019-02-18 21:47:59,632 epoch 43 - iter 364/526 - loss 0.00405976\n", + "2019-02-18 21:48:37,353 epoch 43 - iter 416/526 - loss 0.00410515\n", + "2019-02-18 21:49:15,754 epoch 43 - iter 468/526 - loss 0.00406046\n", + "2019-02-18 21:49:57,043 epoch 43 - iter 520/526 - loss 0.00404571\n", + "2019-02-18 21:50:01,849 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:50:01,851 EPOCH 43 done: loss 0.0041 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 21:50:40,360 DEV : loss 0.00663564 - f-score 0.9235 - acc 0.9235\n", + "2019-02-18 21:51:07,131 TEST : loss 0.01030743 - f-score 0.8772 - acc 0.8772\n", + "2019-02-18 21:51:18,209 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:51:19,306 epoch 44 - iter 0/526 - loss 0.00401964\n", + "2019-02-18 21:51:58,811 epoch 44 - iter 52/526 - loss 0.00365249\n", + "2019-02-18 21:52:40,077 
epoch 44 - iter 104/526 - loss 0.00364939\n", + "2019-02-18 21:53:16,716 epoch 44 - iter 156/526 - loss 0.00394233\n", + "2019-02-18 21:53:53,207 epoch 44 - iter 208/526 - loss 0.00379948\n", + "2019-02-18 21:54:35,587 epoch 44 - iter 260/526 - loss 0.00382793\n", + "2019-02-18 21:55:20,449 epoch 44 - iter 312/526 - loss 0.00389868\n", + "2019-02-18 21:56:02,783 epoch 44 - iter 364/526 - loss 0.00399273\n", + "2019-02-18 21:56:43,280 epoch 44 - iter 416/526 - loss 0.00399537\n", + "2019-02-18 21:57:21,843 epoch 44 - iter 468/526 - loss 0.00396334\n", + "2019-02-18 21:58:02,906 epoch 44 - iter 520/526 - loss 0.00393572\n", + "2019-02-18 21:58:06,344 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:58:06,345 EPOCH 44 done: loss 0.0039 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 21:58:42,066 DEV : loss 0.00663930 - f-score 0.9295 - acc 0.9295\n", + "2019-02-18 21:59:05,664 TEST : loss 0.01006414 - f-score 0.8853 - acc 0.8853\n", + "2019-02-18 21:59:16,482 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 21:59:17,006 epoch 45 - iter 0/526 - loss 0.00515019\n", + "2019-02-18 22:00:00,137 epoch 45 - iter 52/526 - loss 0.00369945\n", + "2019-02-18 22:00:38,321 epoch 45 - iter 104/526 - loss 0.00400419\n", + "2019-02-18 22:01:22,699 epoch 45 - iter 156/526 - loss 0.00412338\n", + "2019-02-18 22:02:02,133 epoch 45 - iter 208/526 - loss 0.00403188\n", + "2019-02-18 22:02:40,725 epoch 45 - iter 260/526 - loss 0.00408112\n", + "2019-02-18 22:03:20,566 epoch 45 - iter 312/526 - loss 0.00400799\n", + "2019-02-18 22:03:58,158 epoch 45 - iter 364/526 - loss 0.00400158\n", + "2019-02-18 22:04:39,585 epoch 45 - iter 416/526 - loss 0.00397888\n", + "2019-02-18 22:05:21,017 epoch 45 - iter 468/526 - loss 0.00402013\n", + "2019-02-18 22:06:00,658 epoch 45 - iter 520/526 - loss 0.00401658\n", + "2019-02-18 22:06:04,127 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:06:04,127 EPOCH 45 done: loss 0.0040 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 22:06:42,391 DEV : loss 0.00681305 - f-score 0.9185 - acc 0.9185\n", + "2019-02-18 22:07:07,580 TEST : loss 0.01078089 - f-score 0.8705 - acc 0.8705\n", + "2019-02-18 22:07:07,584 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:07:08,113 epoch 46 - iter 0/526 - loss 0.00238467\n", + "2019-02-18 22:07:46,985 epoch 46 - iter 52/526 - loss 0.00327575\n", + "2019-02-18 22:08:27,357 epoch 46 - iter 104/526 - loss 0.00342690\n", + "2019-02-18 22:09:09,071 epoch 46 - iter 156/526 - loss 0.00349763\n", + "2019-02-18 22:09:55,669 epoch 46 - iter 208/526 - loss 0.00357279\n", + "2019-02-18 22:10:44,695 epoch 46 - iter 260/526 - loss 0.00359622\n", + "2019-02-18 22:11:24,020 epoch 46 - iter 312/526 - loss 0.00365794\n", + "2019-02-18 22:12:05,325 epoch 46 - iter 364/526 - loss 0.00371609\n", + "2019-02-18 22:12:44,729 epoch 46 - iter 416/526 - loss 0.00374051\n", + "2019-02-18 22:13:23,625 epoch 46 - iter 468/526 - loss 0.00380232\n", + "2019-02-18 22:14:04,731 epoch 46 - iter 520/526 - loss 0.00385406\n", + "2019-02-18 22:14:09,014 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:14:09,015 EPOCH 46 done: loss 0.0038 - lr 0.1000 - bad epochs 1\n", + "2019-02-18 22:14:45,284 DEV : loss 0.00684360 - f-score 0.9260 - acc 0.9260\n", + "2019-02-18 22:15:10,366 TEST : loss 0.00988535 - f-score 0.8858 - acc 0.8858\n", + "2019-02-18 22:15:21,421 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:15:22,113 epoch 47 - iter 0/526 - loss 0.00661816\n", + "2019-02-18 22:16:02,109 epoch 47 - iter 52/526 - loss 0.00370134\n", + "2019-02-18 22:16:44,003 epoch 47 - iter 104/526 
- loss 0.00378943\n", + "2019-02-18 22:17:26,430 epoch 47 - iter 156/526 - loss 0.00380121\n", + "2019-02-18 22:18:10,539 epoch 47 - iter 208/526 - loss 0.00399171\n", + "2019-02-18 22:18:50,717 epoch 47 - iter 260/526 - loss 0.00395213\n", + "2019-02-18 22:19:33,640 epoch 47 - iter 312/526 - loss 0.00392926\n", + "2019-02-18 22:20:13,243 epoch 47 - iter 364/526 - loss 0.00392242\n", + "2019-02-18 22:20:54,344 epoch 47 - iter 416/526 - loss 0.00388569\n", + "2019-02-18 22:21:33,885 epoch 47 - iter 468/526 - loss 0.00387582\n", + "2019-02-18 22:22:17,347 epoch 47 - iter 520/526 - loss 0.00389832\n", + "2019-02-18 22:22:20,526 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:22:20,529 EPOCH 47 done: loss 0.0039 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 22:22:56,845 DEV : loss 0.00683776 - f-score 0.9245 - acc 0.9245\n", + "2019-02-18 22:23:20,835 TEST : loss 0.00988217 - f-score 0.8881 - acc 0.8881\n", + "2019-02-18 22:23:20,839 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:23:21,679 epoch 48 - iter 0/526 - loss 0.00374591\n", + "2019-02-18 22:23:59,756 epoch 48 - iter 52/526 - loss 0.00371948\n", + "2019-02-18 22:24:39,563 epoch 48 - iter 104/526 - loss 0.00373221\n", + "2019-02-18 22:25:19,607 epoch 48 - iter 156/526 - loss 0.00355817\n", + "2019-02-18 22:26:00,138 epoch 48 - iter 208/526 - loss 0.00367312\n", + "2019-02-18 22:26:41,645 epoch 48 - iter 260/526 - loss 0.00361000\n", + "2019-02-18 22:27:24,490 epoch 48 - iter 312/526 - loss 0.00367510\n", + "2019-02-18 22:28:09,611 epoch 48 - iter 364/526 - loss 0.00372203\n", + "2019-02-18 22:28:48,462 epoch 48 - iter 416/526 - loss 0.00374720\n", + "2019-02-18 22:29:29,260 epoch 48 - iter 468/526 - loss 0.00377810\n", + "2019-02-18 22:30:06,519 epoch 48 - iter 520/526 - loss 0.00380874\n", + "2019-02-18 22:30:10,366 
----------------------------------------------------------------------------------------------------\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 22:30:10,368 EPOCH 48 done: loss 0.0038 - lr 0.1000 - bad epochs 1\n", + "2019-02-18 22:30:46,194 DEV : loss 0.00711772 - f-score 0.9185 - acc 0.9185\n", + "2019-02-18 22:31:10,684 TEST : loss 0.01182052 - f-score 0.8728 - acc 0.8728\n", + "2019-02-18 22:31:21,586 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:31:22,504 epoch 49 - iter 0/526 - loss 0.00432880\n", + "2019-02-18 22:32:02,952 epoch 49 - iter 52/526 - loss 0.00273727\n", + "2019-02-18 22:32:44,264 epoch 49 - iter 104/526 - loss 0.00330484\n", + "2019-02-18 22:33:22,541 epoch 49 - iter 156/526 - loss 0.00344824\n", + "2019-02-18 22:34:03,754 epoch 49 - iter 208/526 - loss 0.00345334\n", + "2019-02-18 22:34:46,894 epoch 49 - iter 260/526 - loss 0.00351180\n", + "2019-02-18 22:35:28,065 epoch 49 - iter 312/526 - loss 0.00352594\n", + "2019-02-18 22:36:08,642 epoch 49 - iter 364/526 - loss 0.00349992\n", + "2019-02-18 22:36:52,745 epoch 49 - iter 416/526 - loss 0.00349705\n", + "2019-02-18 22:37:33,047 epoch 49 - iter 468/526 - loss 0.00346704\n", + "2019-02-18 22:38:11,296 epoch 49 - iter 520/526 - loss 0.00349617\n", + "2019-02-18 22:38:14,951 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:38:14,952 EPOCH 49 done: loss 0.0035 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 22:38:53,435 DEV : loss 0.00707259 - f-score 0.9195 - acc 0.9195\n", + "2019-02-18 22:39:19,262 TEST : loss 0.00947260 - f-score 0.8920 - acc 0.8920\n", + "2019-02-18 22:39:30,191 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:39:30,977 epoch 50 - iter 0/526 - loss 0.00229934\n", + "2019-02-18 22:40:13,327 epoch 50 - iter 52/526 - 
loss 0.00319553\n", + "2019-02-18 22:40:50,404 epoch 50 - iter 104/526 - loss 0.00313789\n", + "2019-02-18 22:41:30,296 epoch 50 - iter 156/526 - loss 0.00327911\n", + "2019-02-18 22:42:13,514 epoch 50 - iter 208/526 - loss 0.00326068\n", + "2019-02-18 22:42:55,274 epoch 50 - iter 260/526 - loss 0.00335144\n", + "2019-02-18 22:43:34,746 epoch 50 - iter 312/526 - loss 0.00340644\n", + "2019-02-18 22:44:13,033 epoch 50 - iter 364/526 - loss 0.00346751\n", + "2019-02-18 22:44:52,440 epoch 50 - iter 416/526 - loss 0.00347848\n", + "2019-02-18 22:45:38,279 epoch 50 - iter 468/526 - loss 0.00351688\n", + "2019-02-18 22:46:17,965 epoch 50 - iter 520/526 - loss 0.00345608\n", + "2019-02-18 22:46:21,432 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:46:21,434 EPOCH 50 done: loss 0.0035 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 22:46:58,073 DEV : loss 0.00797859 - f-score 0.9170 - acc 0.9170\n", + "2019-02-18 22:47:24,603 TEST : loss 0.00954126 - f-score 0.8915 - acc 0.8915\n", + "2019-02-18 22:47:35,984 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:47:36,714 epoch 51 - iter 0/526 - loss 0.00388148\n", + "2019-02-18 22:48:16,050 epoch 51 - iter 52/526 - loss 0.00375175\n", + "2019-02-18 22:48:55,596 epoch 51 - iter 104/526 - loss 0.00328642\n", + "2019-02-18 22:49:44,875 epoch 51 - iter 156/526 - loss 0.00330505\n", + "2019-02-18 22:50:25,946 epoch 51 - iter 208/526 - loss 0.00338960\n", + "2019-02-18 22:51:06,464 epoch 51 - iter 260/526 - loss 0.00339443\n", + "2019-02-18 22:51:48,620 epoch 51 - iter 312/526 - loss 0.00343139\n", + "2019-02-18 22:52:33,731 epoch 51 - iter 364/526 - loss 0.00344611\n", + "2019-02-18 22:53:17,798 epoch 51 - iter 416/526 - loss 0.00346570\n", + "2019-02-18 22:54:02,962 epoch 51 - iter 468/526 - loss 0.00350265\n", + "2019-02-18 22:54:45,335 epoch 51 - iter 520/526 - loss 0.00352374\n", + 
"2019-02-18 22:54:48,980 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:54:48,982 EPOCH 51 done: loss 0.0035 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 22:55:27,264 DEV : loss 0.00934036 - f-score 0.9055 - acc 0.9055\n", + "2019-02-18 22:55:53,256 TEST : loss 0.01036092 - f-score 0.8867 - acc 0.8867\n", + "2019-02-18 22:55:53,259 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 22:55:53,909 epoch 52 - iter 0/526 - loss 0.00092397\n", + "2019-02-18 22:56:36,639 epoch 52 - iter 52/526 - loss 0.00343864\n", + "2019-02-18 22:57:21,556 epoch 52 - iter 104/526 - loss 0.00325611\n", + "2019-02-18 22:58:03,737 epoch 52 - iter 156/526 - loss 0.00335475\n", + "2019-02-18 22:58:48,484 epoch 52 - iter 208/526 - loss 0.00335209\n", + "2019-02-18 22:59:33,400 epoch 52 - iter 260/526 - loss 0.00340309\n", + "2019-02-18 23:00:15,874 epoch 52 - iter 312/526 - loss 0.00334400\n", + "2019-02-18 23:00:58,535 epoch 52 - iter 364/526 - loss 0.00336129\n", + "2019-02-18 23:01:43,574 epoch 52 - iter 416/526 - loss 0.00346382\n", + "2019-02-18 23:02:25,829 epoch 52 - iter 468/526 - loss 0.00342028\n", + "2019-02-18 23:03:06,531 epoch 52 - iter 520/526 - loss 0.00345363\n", + "2019-02-18 23:03:10,190 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:03:10,192 EPOCH 52 done: loss 0.0035 - lr 0.1000 - bad epochs 1\n", + "2019-02-18 23:03:49,447 DEV : loss 0.00713309 - f-score 0.9180 - acc 0.9180\n", + "2019-02-18 23:04:15,788 TEST : loss 0.01041376 - f-score 0.8834 - acc 0.8834\n", + "2019-02-18 23:04:26,668 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:04:27,775 epoch 53 - iter 0/526 - loss 0.00372904\n", + "2019-02-18 23:05:08,489 epoch 53 - iter 52/526 - loss 0.00302973\n", + "2019-02-18 23:05:49,892 
epoch 53 - iter 104/526 - loss 0.00322269\n", + "2019-02-18 23:06:29,050 epoch 53 - iter 156/526 - loss 0.00317444\n", + "2019-02-18 23:07:12,329 epoch 53 - iter 208/526 - loss 0.00306875\n", + "2019-02-18 23:07:51,825 epoch 53 - iter 260/526 - loss 0.00316483\n", + "2019-02-18 23:08:30,141 epoch 53 - iter 312/526 - loss 0.00323263\n", + "2019-02-18 23:09:07,720 epoch 53 - iter 364/526 - loss 0.00326291\n", + "2019-02-18 23:09:53,126 epoch 53 - iter 416/526 - loss 0.00327111\n", + "2019-02-18 23:10:29,478 epoch 53 - iter 468/526 - loss 0.00329684\n", + "2019-02-18 23:11:09,776 epoch 53 - iter 520/526 - loss 0.00333445\n", + "2019-02-18 23:11:13,475 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:11:13,476 EPOCH 53 done: loss 0.0033 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 23:11:49,293 DEV : loss 0.00780328 - f-score 0.9140 - acc 0.9140\n", + "2019-02-18 23:12:14,305 TEST : loss 0.00930190 - f-score 0.8967 - acc 0.8967\n", + "2019-02-18 23:12:25,234 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:12:25,728 epoch 54 - iter 0/526 - loss 0.00407488\n", + "2019-02-18 23:13:07,861 epoch 54 - iter 52/526 - loss 0.00330168\n", + "2019-02-18 23:13:51,577 epoch 54 - iter 104/526 - loss 0.00303882\n", + "2019-02-18 23:14:29,206 epoch 54 - iter 156/526 - loss 0.00310417\n", + "2019-02-18 23:15:08,709 epoch 54 - iter 208/526 - loss 0.00313229\n", + "2019-02-18 23:15:51,484 epoch 54 - iter 260/526 - loss 0.00303136\n", + "2019-02-18 23:16:31,666 epoch 54 - iter 312/526 - loss 0.00297755\n", + "2019-02-18 23:17:10,414 epoch 54 - iter 364/526 - loss 0.00300270\n", + "2019-02-18 23:17:50,981 epoch 54 - iter 416/526 - loss 0.00304721\n", + "2019-02-18 23:18:34,679 epoch 54 - iter 468/526 - loss 0.00310522\n", + "2019-02-18 23:19:15,449 epoch 54 - iter 520/526 - loss 0.00318497\n", + "2019-02-18 23:19:18,679 
----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:19:18,680 EPOCH 54 done: loss 0.0032 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 23:19:55,082 DEV : loss 0.00677184 - f-score 0.9260 - acc 0.9260\n", + "2019-02-18 23:20:19,809 TEST : loss 0.00938160 - f-score 0.8896 - acc 0.8896\n", + "2019-02-18 23:20:30,772 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:20:31,800 epoch 55 - iter 0/526 - loss 0.00073507\n", + "2019-02-18 23:21:11,730 epoch 55 - iter 52/526 - loss 0.00248448\n", + "2019-02-18 23:21:49,714 epoch 55 - iter 104/526 - loss 0.00279474\n", + "2019-02-18 23:22:33,708 epoch 55 - iter 156/526 - loss 0.00317448\n", + "2019-02-18 23:23:15,418 epoch 55 - iter 208/526 - loss 0.00318162\n", + "2019-02-18 23:23:57,558 epoch 55 - iter 260/526 - loss 0.00317461\n", + "2019-02-18 23:24:36,509 epoch 55 - iter 312/526 - loss 0.00325967\n", + "2019-02-18 23:25:22,885 epoch 55 - iter 364/526 - loss 0.00322780\n", + "2019-02-18 23:26:02,505 epoch 55 - iter 416/526 - loss 0.00324162\n", + "2019-02-18 23:26:44,647 epoch 55 - iter 468/526 - loss 0.00324057\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-18 23:27:31,149 epoch 55 - iter 520/526 - loss 0.00325132\n", + "2019-02-18 23:27:35,224 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:27:35,225 EPOCH 55 done: loss 0.0032 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 23:28:25,572 DEV : loss 0.00798117 - f-score 0.9240 - acc 0.9240\n", + "2019-02-18 23:28:52,407 TEST : loss 0.01260192 - f-score 0.8752 - acc 0.8752\n", + "2019-02-18 23:28:52,410 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:28:53,168 epoch 56 - iter 0/526 - loss 0.00118866\n", + "2019-02-18 23:29:33,703 epoch 56 - iter 52/526 - 
loss 0.00245853\n", + "2019-02-18 23:30:17,666 epoch 56 - iter 104/526 - loss 0.00264936\n", + "2019-02-18 23:30:56,443 epoch 56 - iter 156/526 - loss 0.00287769\n", + "2019-02-18 23:31:37,056 epoch 56 - iter 208/526 - loss 0.00289000\n", + "2019-02-18 23:32:16,691 epoch 56 - iter 260/526 - loss 0.00300595\n", + "2019-02-18 23:32:56,661 epoch 56 - iter 312/526 - loss 0.00290452\n", + "2019-02-18 23:33:48,151 epoch 56 - iter 364/526 - loss 0.00288159\n", + "2019-02-18 23:34:28,956 epoch 56 - iter 416/526 - loss 0.00298162\n", + "2019-02-18 23:35:09,728 epoch 56 - iter 468/526 - loss 0.00305390\n", + "2019-02-18 23:35:52,027 epoch 56 - iter 520/526 - loss 0.00306228\n", + "2019-02-18 23:35:55,262 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:35:55,263 EPOCH 56 done: loss 0.0031 - lr 0.1000 - bad epochs 1\n", + "2019-02-18 23:36:31,906 DEV : loss 0.00798300 - f-score 0.9230 - acc 0.9230\n", + "2019-02-18 23:36:56,797 TEST : loss 0.01210687 - f-score 0.8767 - acc 0.8767\n", + "2019-02-18 23:37:08,047 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:37:08,780 epoch 57 - iter 0/526 - loss 0.00542540\n", + "2019-02-18 23:37:50,816 epoch 57 - iter 52/526 - loss 0.00316473\n", + "2019-02-18 23:38:32,956 epoch 57 - iter 104/526 - loss 0.00287327\n", + "2019-02-18 23:39:17,958 epoch 57 - iter 156/526 - loss 0.00288073\n", + "2019-02-18 23:40:01,280 epoch 57 - iter 208/526 - loss 0.00287998\n", + "2019-02-18 23:40:43,286 epoch 57 - iter 260/526 - loss 0.00288271\n", + "2019-02-18 23:41:24,718 epoch 57 - iter 312/526 - loss 0.00289988\n", + "2019-02-18 23:42:05,496 epoch 57 - iter 364/526 - loss 0.00297501\n", + "2019-02-18 23:42:45,062 epoch 57 - iter 416/526 - loss 0.00304170\n", + "2019-02-18 23:43:23,455 epoch 57 - iter 468/526 - loss 0.00299723\n", + "2019-02-18 23:44:09,098 epoch 57 - iter 520/526 - loss 0.00304574\n", + 
"2019-02-18 23:44:12,583 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:44:12,585 EPOCH 57 done: loss 0.0031 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 23:44:51,040 DEV : loss 0.00787286 - f-score 0.9205 - acc 0.9205\n", + "2019-02-18 23:45:17,592 TEST : loss 0.01184142 - f-score 0.8834 - acc 0.8834\n", + "2019-02-18 23:45:28,686 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:45:29,418 epoch 58 - iter 0/526 - loss 0.00108189\n", + "2019-02-18 23:46:04,356 epoch 58 - iter 52/526 - loss 0.00370117\n", + "2019-02-18 23:46:40,339 epoch 58 - iter 104/526 - loss 0.00309483\n", + "2019-02-18 23:47:18,333 epoch 58 - iter 156/526 - loss 0.00312497\n", + "2019-02-18 23:48:01,569 epoch 58 - iter 208/526 - loss 0.00322787\n", + "2019-02-18 23:48:46,501 epoch 58 - iter 260/526 - loss 0.00310435\n", + "2019-02-18 23:49:28,123 epoch 58 - iter 312/526 - loss 0.00299135\n", + "2019-02-18 23:50:13,803 epoch 58 - iter 364/526 - loss 0.00300436\n", + "2019-02-18 23:50:57,020 epoch 58 - iter 416/526 - loss 0.00302056\n", + "2019-02-18 23:51:35,830 epoch 58 - iter 468/526 - loss 0.00298431\n", + "2019-02-18 23:52:17,890 epoch 58 - iter 520/526 - loss 0.00295317\n", + "2019-02-18 23:52:22,014 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:52:22,015 EPOCH 58 done: loss 0.0029 - lr 0.1000 - bad epochs 0\n", + "2019-02-18 23:52:57,624 DEV : loss 0.00805508 - f-score 0.9205 - acc 0.9205\n", + "2019-02-18 23:53:22,376 TEST : loss 0.01032458 - f-score 0.8910 - acc 0.8910\n", + "2019-02-18 23:53:33,289 ----------------------------------------------------------------------------------------------------\n", + "2019-02-18 23:53:34,149 epoch 59 - iter 0/526 - loss 0.00282102\n", + "2019-02-18 23:54:15,747 epoch 59 - iter 52/526 - loss 0.00278821\n", + "2019-02-18 23:54:56,560 
epoch 59 - iter 104/526 - loss 0.00255563\n", + "2019-02-18 23:55:38,083 epoch 59 - iter 156/526 - loss 0.00272326\n", + "2019-02-18 23:56:18,717 epoch 59 - iter 208/526 - loss 0.00273410\n", + "2019-02-18 23:57:00,737 epoch 59 - iter 260/526 - loss 0.00276645\n", + "2019-02-18 23:57:41,298 epoch 59 - iter 312/526 - loss 0.00280639\n", + "2019-02-18 23:58:21,768 epoch 59 - iter 364/526 - loss 0.00279493\n", + "2019-02-18 23:59:04,079 epoch 59 - iter 416/526 - loss 0.00285703\n", + "2019-02-18 23:59:54,448 epoch 59 - iter 468/526 - loss 0.00288722\n", + "2019-02-19 00:00:38,109 epoch 59 - iter 520/526 - loss 0.00286601\n", + "2019-02-19 00:00:41,648 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:00:41,649 EPOCH 59 done: loss 0.0029 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:01:20,016 DEV : loss 0.00815735 - f-score 0.9240 - acc 0.9240\n", + "2019-02-19 00:01:47,344 TEST : loss 0.01191089 - f-score 0.8858 - acc 0.8858\n", + "2019-02-19 00:01:58,216 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:01:59,060 epoch 60 - iter 0/526 - loss 0.00610146\n", + "2019-02-19 00:02:38,283 epoch 60 - iter 52/526 - loss 0.00247116\n", + "2019-02-19 00:03:16,193 epoch 60 - iter 104/526 - loss 0.00231581\n", + "2019-02-19 00:03:57,802 epoch 60 - iter 156/526 - loss 0.00242107\n", + "2019-02-19 00:04:36,135 epoch 60 - iter 208/526 - loss 0.00257680\n", + "2019-02-19 00:05:15,773 epoch 60 - iter 260/526 - loss 0.00270869\n", + "2019-02-19 00:05:57,391 epoch 60 - iter 312/526 - loss 0.00273444\n", + "2019-02-19 00:06:38,909 epoch 60 - iter 364/526 - loss 0.00281719\n", + "2019-02-19 00:07:32,448 epoch 60 - iter 416/526 - loss 0.00278299\n", + "2019-02-19 00:08:16,093 epoch 60 - iter 468/526 - loss 0.00283406\n", + "2019-02-19 00:08:57,384 epoch 60 - iter 520/526 - loss 0.00283877\n", + "2019-02-19 00:09:01,990 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:09:01,991 EPOCH 60 done: loss 0.0028 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:09:40,495 DEV : loss 0.00791260 - f-score 0.9245 - acc 0.9245\n", + "2019-02-19 00:10:06,688 TEST : loss 0.01081203 - f-score 0.8924 - acc 0.8924\n", + "2019-02-19 00:10:17,925 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:10:18,810 epoch 61 - iter 0/526 - loss 0.00050923\n", + "2019-02-19 00:11:02,971 epoch 61 - iter 52/526 - loss 0.00260678\n", + "2019-02-19 00:11:42,612 epoch 61 - iter 104/526 - loss 0.00249397\n", + "2019-02-19 00:12:25,655 epoch 61 - iter 156/526 - loss 0.00242163\n", + "2019-02-19 00:13:10,206 epoch 61 - iter 208/526 - loss 0.00255181\n", + "2019-02-19 00:13:48,663 epoch 61 - iter 260/526 - loss 0.00265703\n", + "2019-02-19 00:14:26,656 epoch 61 - iter 312/526 - loss 0.00281335\n", + "2019-02-19 00:15:11,474 epoch 61 - iter 364/526 - loss 0.00280355\n", + "2019-02-19 00:15:59,311 epoch 61 - iter 416/526 - loss 0.00280971\n", + "2019-02-19 00:16:41,540 epoch 61 - iter 468/526 - loss 0.00276764\n", + "2019-02-19 00:17:26,352 epoch 61 - iter 520/526 - loss 0.00278377\n", + "2019-02-19 00:17:30,024 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:17:30,025 EPOCH 61 done: loss 0.0028 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:18:07,367 DEV : loss 0.00865918 - f-score 0.9195 - acc 0.9195\n", + "2019-02-19 00:18:33,441 TEST : loss 0.01084274 - f-score 0.8934 - acc 0.8934\n", + "2019-02-19 00:18:44,363 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:18:45,061 epoch 62 - iter 0/526 - loss 0.00034932\n", + "2019-02-19 00:19:25,300 epoch 62 - iter 52/526 - loss 0.00227827\n", + "2019-02-19 00:20:04,243 epoch 62 - iter 104/526 
- loss 0.00282858\n", + "2019-02-19 00:20:46,248 epoch 62 - iter 156/526 - loss 0.00284658\n", + "2019-02-19 00:21:23,149 epoch 62 - iter 208/526 - loss 0.00293704\n", + "2019-02-19 00:22:03,143 epoch 62 - iter 260/526 - loss 0.00281066\n", + "2019-02-19 00:22:42,486 epoch 62 - iter 312/526 - loss 0.00285570\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 00:23:22,553 epoch 62 - iter 364/526 - loss 0.00278258\n", + "2019-02-19 00:24:04,943 epoch 62 - iter 416/526 - loss 0.00275699\n", + "2019-02-19 00:24:44,488 epoch 62 - iter 468/526 - loss 0.00277452\n", + "2019-02-19 00:25:31,105 epoch 62 - iter 520/526 - loss 0.00276041\n", + "2019-02-19 00:25:35,058 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:25:35,059 EPOCH 62 done: loss 0.0028 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:26:11,235 DEV : loss 0.00735644 - f-score 0.9220 - acc 0.9220\n", + "2019-02-19 00:26:38,238 TEST : loss 0.01034874 - f-score 0.8896 - acc 0.8896\n", + "2019-02-19 00:26:49,198 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:26:49,778 epoch 63 - iter 0/526 - loss 0.00223490\n", + "2019-02-19 00:27:41,750 epoch 63 - iter 52/526 - loss 0.00236185\n", + "2019-02-19 00:28:34,866 epoch 63 - iter 104/526 - loss 0.00236702\n", + "2019-02-19 00:29:13,655 epoch 63 - iter 156/526 - loss 0.00243840\n", + "2019-02-19 00:29:53,758 epoch 63 - iter 208/526 - loss 0.00242682\n", + "2019-02-19 00:30:33,548 epoch 63 - iter 260/526 - loss 0.00247188\n", + "2019-02-19 00:31:15,130 epoch 63 - iter 312/526 - loss 0.00247130\n", + "2019-02-19 00:31:54,391 epoch 63 - iter 364/526 - loss 0.00245345\n", + "2019-02-19 00:32:31,563 epoch 63 - iter 416/526 - loss 0.00250323\n", + "2019-02-19 00:33:09,772 epoch 63 - iter 468/526 - loss 0.00254974\n", + "2019-02-19 00:33:50,084 epoch 63 - iter 520/526 - loss 0.00256905\n", + 
"2019-02-19 00:33:54,138 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:33:54,140 EPOCH 63 done: loss 0.0026 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:34:34,366 DEV : loss 0.00804905 - f-score 0.9210 - acc 0.9210\n", + "2019-02-19 00:35:02,142 TEST : loss 0.01207406 - f-score 0.8752 - acc 0.8752\n", + "2019-02-19 00:35:13,128 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:35:13,936 epoch 64 - iter 0/526 - loss 0.00028811\n", + "2019-02-19 00:35:55,740 epoch 64 - iter 52/526 - loss 0.00238117\n", + "2019-02-19 00:36:38,204 epoch 64 - iter 104/526 - loss 0.00250847\n", + "2019-02-19 00:37:20,608 epoch 64 - iter 156/526 - loss 0.00253019\n", + "2019-02-19 00:37:59,927 epoch 64 - iter 208/526 - loss 0.00258418\n", + "2019-02-19 00:38:45,727 epoch 64 - iter 260/526 - loss 0.00265268\n", + "2019-02-19 00:39:25,200 epoch 64 - iter 312/526 - loss 0.00258906\n", + "2019-02-19 00:40:07,438 epoch 64 - iter 364/526 - loss 0.00271621\n", + "2019-02-19 00:40:51,982 epoch 64 - iter 416/526 - loss 0.00274402\n", + "2019-02-19 00:41:32,007 epoch 64 - iter 468/526 - loss 0.00268537\n", + "2019-02-19 00:42:12,228 epoch 64 - iter 520/526 - loss 0.00269436\n", + "2019-02-19 00:42:16,327 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:42:16,328 EPOCH 64 done: loss 0.0027 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:42:52,499 DEV : loss 0.00891922 - f-score 0.9230 - acc 0.9230\n", + "2019-02-19 00:43:18,114 TEST : loss 0.01327625 - f-score 0.8795 - acc 0.8795\n", + "2019-02-19 00:43:18,116 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:43:18,817 epoch 65 - iter 0/526 - loss 0.00217022\n", + "2019-02-19 00:43:55,057 epoch 65 - iter 52/526 - loss 0.00266105\n", + "2019-02-19 00:44:32,573 
epoch 65 - iter 104/526 - loss 0.00257228\n", + "2019-02-19 00:45:16,399 epoch 65 - iter 156/526 - loss 0.00255856\n", + "2019-02-19 00:45:55,981 epoch 65 - iter 208/526 - loss 0.00239845\n", + "2019-02-19 00:46:33,930 epoch 65 - iter 260/526 - loss 0.00244004\n", + "2019-02-19 00:47:20,597 epoch 65 - iter 312/526 - loss 0.00253080\n", + "2019-02-19 00:48:01,008 epoch 65 - iter 364/526 - loss 0.00258291\n", + "2019-02-19 00:48:46,487 epoch 65 - iter 416/526 - loss 0.00251281\n", + "2019-02-19 00:49:28,760 epoch 65 - iter 468/526 - loss 0.00253580\n", + "2019-02-19 00:50:06,880 epoch 65 - iter 520/526 - loss 0.00251206\n", + "2019-02-19 00:50:10,841 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:50:10,841 EPOCH 65 done: loss 0.0025 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 00:50:47,185 DEV : loss 0.00777686 - f-score 0.9200 - acc 0.9200\n", + "2019-02-19 00:51:12,007 TEST : loss 0.01157837 - f-score 0.8810 - acc 0.8810\n", + "2019-02-19 00:51:22,839 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:51:23,639 epoch 66 - iter 0/526 - loss 0.00292374\n", + "2019-02-19 00:52:08,642 epoch 66 - iter 52/526 - loss 0.00262003\n", + "2019-02-19 00:52:47,759 epoch 66 - iter 104/526 - loss 0.00244041\n", + "2019-02-19 00:53:24,248 epoch 66 - iter 156/526 - loss 0.00255294\n", + "2019-02-19 00:54:06,633 epoch 66 - iter 208/526 - loss 0.00241041\n", + "2019-02-19 00:54:46,512 epoch 66 - iter 260/526 - loss 0.00246299\n", + "2019-02-19 00:55:26,570 epoch 66 - iter 312/526 - loss 0.00248248\n", + "2019-02-19 00:56:07,497 epoch 66 - iter 364/526 - loss 0.00248905\n", + "2019-02-19 00:56:47,703 epoch 66 - iter 416/526 - loss 0.00250246\n", + "2019-02-19 00:57:29,005 epoch 66 - iter 468/526 - loss 0.00251366\n", + "2019-02-19 00:58:13,522 epoch 66 - iter 520/526 - loss 0.00255076\n", + "2019-02-19 00:58:16,994 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:58:16,995 EPOCH 66 done: loss 0.0025 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 00:58:59,352 DEV : loss 0.01033701 - f-score 0.9135 - acc 0.9135\n", + "2019-02-19 00:59:25,782 TEST : loss 0.01172750 - f-score 0.8901 - acc 0.8901\n", + "2019-02-19 00:59:25,785 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 00:59:26,338 epoch 67 - iter 0/526 - loss 0.00406442\n", + "2019-02-19 01:00:10,748 epoch 67 - iter 52/526 - loss 0.00254583\n", + "2019-02-19 01:00:49,351 epoch 67 - iter 104/526 - loss 0.00241898\n", + "2019-02-19 01:01:31,104 epoch 67 - iter 156/526 - loss 0.00244464\n", + "2019-02-19 01:02:10,538 epoch 67 - iter 208/526 - loss 0.00234420\n", + "2019-02-19 01:02:53,511 epoch 67 - iter 260/526 - loss 0.00238693\n", + "2019-02-19 01:03:30,879 epoch 67 - iter 312/526 - loss 0.00245075\n", + "2019-02-19 01:04:13,062 epoch 67 - iter 364/526 - loss 0.00240967\n", + "2019-02-19 01:04:54,868 epoch 67 - iter 416/526 - loss 0.00244997\n", + "2019-02-19 01:05:36,854 epoch 67 - iter 468/526 - loss 0.00249924\n", + "2019-02-19 01:06:13,406 epoch 67 - iter 520/526 - loss 0.00249006\n", + "2019-02-19 01:06:17,592 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:06:17,593 EPOCH 67 done: loss 0.0025 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 01:06:53,554 DEV : loss 0.00929861 - f-score 0.9195 - acc 0.9195\n", + "2019-02-19 01:07:18,693 TEST : loss 0.01209871 - f-score 0.8915 - acc 0.8915\n", + "2019-02-19 01:07:29,708 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:07:30,333 epoch 68 - iter 0/526 - loss 0.00133460\n", + "2019-02-19 01:08:08,123 epoch 68 - iter 52/526 - loss 0.00229490\n", + "2019-02-19 01:08:46,754 epoch 68 - iter 104/526 
- loss 0.00254624\n", + "2019-02-19 01:09:25,125 epoch 68 - iter 156/526 - loss 0.00243393\n", + "2019-02-19 01:10:09,529 epoch 68 - iter 208/526 - loss 0.00233091\n", + "2019-02-19 01:10:51,658 epoch 68 - iter 260/526 - loss 0.00246447\n", + "2019-02-19 01:11:30,740 epoch 68 - iter 312/526 - loss 0.00245493\n", + "2019-02-19 01:12:11,646 epoch 68 - iter 364/526 - loss 0.00251110\n", + "2019-02-19 01:12:52,270 epoch 68 - iter 416/526 - loss 0.00246071\n", + "2019-02-19 01:13:38,552 epoch 68 - iter 468/526 - loss 0.00241373\n", + "2019-02-19 01:14:21,456 epoch 68 - iter 520/526 - loss 0.00245487\n", + "2019-02-19 01:14:25,221 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:14:25,222 EPOCH 68 done: loss 0.0025 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 01:15:03,895 DEV : loss 0.00871720 - f-score 0.9145 - acc 0.9145\n", + "2019-02-19 01:15:29,991 TEST : loss 0.01106954 - f-score 0.8829 - acc 0.8829\n", + "2019-02-19 01:15:40,829 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:15:42,132 epoch 69 - iter 0/526 - loss 0.00181395\n", + "2019-02-19 01:16:25,256 epoch 69 - iter 52/526 - loss 0.00205936\n", + "2019-02-19 01:17:04,417 epoch 69 - iter 104/526 - loss 0.00212097\n", + "2019-02-19 01:17:45,235 epoch 69 - iter 156/526 - loss 0.00209010\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 01:18:29,297 epoch 69 - iter 208/526 - loss 0.00211917\n", + "2019-02-19 01:19:09,736 epoch 69 - iter 260/526 - loss 0.00231962\n", + "2019-02-19 01:19:50,833 epoch 69 - iter 312/526 - loss 0.00240284\n", + "2019-02-19 01:20:32,683 epoch 69 - iter 364/526 - loss 0.00244005\n", + "2019-02-19 01:21:13,577 epoch 69 - iter 416/526 - loss 0.00246184\n", + "2019-02-19 01:21:53,515 epoch 69 - iter 468/526 - loss 0.00242231\n", + "2019-02-19 01:22:34,498 epoch 69 - iter 520/526 - loss 0.00246337\n", + 
"2019-02-19 01:22:38,061 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:22:38,062 EPOCH 69 done: loss 0.0025 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 01:23:16,833 DEV : loss 0.00926123 - f-score 0.9220 - acc 0.9220\n", + "2019-02-19 01:23:44,206 TEST : loss 0.01422705 - f-score 0.8719 - acc 0.8719\n", + "2019-02-19 01:23:55,218 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:23:56,038 epoch 70 - iter 0/526 - loss 0.00366507\n", + "2019-02-19 01:24:35,820 epoch 70 - iter 52/526 - loss 0.00263450\n", + "2019-02-19 01:25:22,307 epoch 70 - iter 104/526 - loss 0.00237126\n", + "2019-02-19 01:26:01,104 epoch 70 - iter 156/526 - loss 0.00222151\n", + "2019-02-19 01:26:43,815 epoch 70 - iter 208/526 - loss 0.00240983\n", + "2019-02-19 01:27:23,405 epoch 70 - iter 260/526 - loss 0.00242108\n", + "2019-02-19 01:28:09,025 epoch 70 - iter 312/526 - loss 0.00236389\n", + "2019-02-19 01:28:49,716 epoch 70 - iter 364/526 - loss 0.00236170\n", + "2019-02-19 01:29:29,710 epoch 70 - iter 416/526 - loss 0.00238424\n", + "2019-02-19 01:30:08,956 epoch 70 - iter 468/526 - loss 0.00236710\n", + "2019-02-19 01:30:50,037 epoch 70 - iter 520/526 - loss 0.00236953\n", + "2019-02-19 01:30:54,005 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:30:54,006 EPOCH 70 done: loss 0.0024 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 01:31:29,214 DEV : loss 0.00926350 - f-score 0.9230 - acc 0.9230\n", + "2019-02-19 01:31:54,161 TEST : loss 0.01213447 - f-score 0.8891 - acc 0.8891\n", + "2019-02-19 01:32:04,939 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:32:05,753 epoch 71 - iter 0/526 - loss 0.00028783\n", + "2019-02-19 01:32:47,597 epoch 71 - iter 52/526 - loss 0.00189563\n", + "2019-02-19 01:33:27,771 
epoch 71 - iter 104/526 - loss 0.00195687\n", + "2019-02-19 01:34:13,385 epoch 71 - iter 156/526 - loss 0.00206313\n", + "2019-02-19 01:34:55,858 epoch 71 - iter 208/526 - loss 0.00222775\n", + "2019-02-19 01:35:39,642 epoch 71 - iter 260/526 - loss 0.00223508\n", + "2019-02-19 01:36:24,105 epoch 71 - iter 312/526 - loss 0.00229322\n", + "2019-02-19 01:37:02,901 epoch 71 - iter 364/526 - loss 0.00234192\n", + "2019-02-19 01:37:42,704 epoch 71 - iter 416/526 - loss 0.00233389\n", + "2019-02-19 01:38:29,428 epoch 71 - iter 468/526 - loss 0.00235340\n", + "2019-02-19 01:39:09,396 epoch 71 - iter 520/526 - loss 0.00240196\n", + "2019-02-19 01:39:13,242 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:39:13,244 EPOCH 71 done: loss 0.0024 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 01:39:50,747 DEV : loss 0.00911213 - f-score 0.9205 - acc 0.9205\n", + "2019-02-19 01:40:17,351 TEST : loss 0.01078602 - f-score 0.8877 - acc 0.8877\n", + "2019-02-19 01:40:17,355 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:40:18,109 epoch 72 - iter 0/526 - loss 0.00247123\n", + "2019-02-19 01:41:02,900 epoch 72 - iter 52/526 - loss 0.00183861\n", + "2019-02-19 01:41:43,753 epoch 72 - iter 104/526 - loss 0.00205073\n", + "2019-02-19 01:42:29,150 epoch 72 - iter 156/526 - loss 0.00232858\n", + "2019-02-19 01:43:09,966 epoch 72 - iter 208/526 - loss 0.00235987\n", + "2019-02-19 01:43:49,982 epoch 72 - iter 260/526 - loss 0.00234824\n", + "2019-02-19 01:44:31,561 epoch 72 - iter 312/526 - loss 0.00238126\n", + "2019-02-19 01:45:14,203 epoch 72 - iter 364/526 - loss 0.00232852\n", + "2019-02-19 01:45:53,362 epoch 72 - iter 416/526 - loss 0.00231680\n", + "2019-02-19 01:46:30,007 epoch 72 - iter 468/526 - loss 0.00230169\n", + "2019-02-19 01:47:10,531 epoch 72 - iter 520/526 - loss 0.00229159\n", + "2019-02-19 01:47:14,820 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:47:14,821 EPOCH 72 done: loss 0.0023 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 01:47:50,080 DEV : loss 0.00948996 - f-score 0.9195 - acc 0.9195\n", + "2019-02-19 01:48:14,642 TEST : loss 0.01261456 - f-score 0.8915 - acc 0.8915\n", + "2019-02-19 01:48:25,421 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:48:26,118 epoch 73 - iter 0/526 - loss 0.00011234\n", + "2019-02-19 01:49:05,493 epoch 73 - iter 52/526 - loss 0.00206336\n", + "2019-02-19 01:49:41,701 epoch 73 - iter 104/526 - loss 0.00221668\n", + "2019-02-19 01:50:19,689 epoch 73 - iter 156/526 - loss 0.00214525\n", + "2019-02-19 01:51:00,099 epoch 73 - iter 208/526 - loss 0.00217245\n", + "2019-02-19 01:51:41,649 epoch 73 - iter 260/526 - loss 0.00218513\n", + "2019-02-19 01:52:25,708 epoch 73 - iter 312/526 - loss 0.00215204\n", + "2019-02-19 01:53:08,101 epoch 73 - iter 364/526 - loss 0.00215785\n", + "2019-02-19 01:53:45,959 epoch 73 - iter 416/526 - loss 0.00214769\n", + "2019-02-19 01:54:28,707 epoch 73 - iter 468/526 - loss 0.00220016\n", + "2019-02-19 01:55:09,980 epoch 73 - iter 520/526 - loss 0.00220002\n", + "2019-02-19 01:55:13,206 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:55:13,208 EPOCH 73 done: loss 0.0022 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 01:55:49,597 DEV : loss 0.00898498 - f-score 0.9210 - acc 0.9210\n", + "2019-02-19 01:56:13,656 TEST : loss 0.01489249 - f-score 0.8585 - acc 0.8585\n", + "2019-02-19 01:56:24,429 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 01:56:25,134 epoch 74 - iter 0/526 - loss 0.00045626\n", + "2019-02-19 01:57:06,090 epoch 74 - iter 52/526 - loss 0.00197132\n", + "2019-02-19 01:57:43,213 epoch 74 - iter 104/526 
- loss 0.00202614\n", + "2019-02-19 01:58:25,424 epoch 74 - iter 156/526 - loss 0.00206083\n", + "2019-02-19 01:59:03,954 epoch 74 - iter 208/526 - loss 0.00209924\n", + "2019-02-19 01:59:42,959 epoch 74 - iter 260/526 - loss 0.00213567\n", + "2019-02-19 02:00:23,488 epoch 74 - iter 312/526 - loss 0.00211349\n", + "2019-02-19 02:01:04,542 epoch 74 - iter 364/526 - loss 0.00216789\n", + "2019-02-19 02:01:46,701 epoch 74 - iter 416/526 - loss 0.00215544\n", + "2019-02-19 02:02:28,801 epoch 74 - iter 468/526 - loss 0.00220382\n", + "2019-02-19 02:03:19,784 epoch 74 - iter 520/526 - loss 0.00220328\n", + "2019-02-19 02:03:24,042 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:03:24,045 EPOCH 74 done: loss 0.0022 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 02:04:03,844 DEV : loss 0.00927694 - f-score 0.9270 - acc 0.9270\n", + "2019-02-19 02:04:30,670 TEST : loss 0.01332265 - f-score 0.8838 - acc 0.8838\n", + "2019-02-19 02:04:30,673 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:04:31,391 epoch 75 - iter 0/526 - loss 0.00578790\n", + "2019-02-19 02:05:13,157 epoch 75 - iter 52/526 - loss 0.00201705\n", + "2019-02-19 02:05:58,713 epoch 75 - iter 104/526 - loss 0.00176217\n", + "2019-02-19 02:06:42,236 epoch 75 - iter 156/526 - loss 0.00161076\n", + "2019-02-19 02:07:22,574 epoch 75 - iter 208/526 - loss 0.00153212\n", + "2019-02-19 02:08:08,605 epoch 75 - iter 260/526 - loss 0.00162826\n", + "2019-02-19 02:08:46,940 epoch 75 - iter 312/526 - loss 0.00181670\n", + "2019-02-19 02:09:25,555 epoch 75 - iter 364/526 - loss 0.00183147\n", + "2019-02-19 02:10:04,681 epoch 75 - iter 416/526 - loss 0.00187992\n", + "2019-02-19 02:10:46,617 epoch 75 - iter 468/526 - loss 0.00195198\n", + "2019-02-19 02:11:32,250 epoch 75 - iter 520/526 - loss 0.00193492\n", + "2019-02-19 02:11:36,292 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:11:36,294 EPOCH 75 done: loss 0.0019 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 02:12:13,277 DEV : loss 0.00957381 - f-score 0.9220 - acc 0.9220\n", + "2019-02-19 02:12:39,055 TEST : loss 0.01183666 - f-score 0.8920 - acc 0.8920\n", + "2019-02-19 02:12:50,140 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:12:50,941 epoch 76 - iter 0/526 - loss 0.00323863\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 02:13:29,638 epoch 76 - iter 52/526 - loss 0.00212599\n", + "2019-02-19 02:14:10,552 epoch 76 - iter 104/526 - loss 0.00208220\n", + "2019-02-19 02:14:52,904 epoch 76 - iter 156/526 - loss 0.00190547\n", + "2019-02-19 02:15:34,351 epoch 76 - iter 208/526 - loss 0.00184827\n", + "2019-02-19 02:16:15,470 epoch 76 - iter 260/526 - loss 0.00175899\n", + "2019-02-19 02:16:56,341 epoch 76 - iter 312/526 - loss 0.00181931\n", + "2019-02-19 02:17:34,116 epoch 76 - iter 364/526 - loss 0.00181837\n", + "2019-02-19 02:18:12,453 epoch 76 - iter 416/526 - loss 0.00178375\n", + "2019-02-19 02:18:53,565 epoch 76 - iter 468/526 - loss 0.00188068\n", + "2019-02-19 02:19:32,419 epoch 76 - iter 520/526 - loss 0.00193227\n", + "2019-02-19 02:19:35,982 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:19:35,983 EPOCH 76 done: loss 0.0019 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 02:20:11,972 DEV : loss 0.00917836 - f-score 0.9205 - acc 0.9205\n", + "2019-02-19 02:20:36,564 TEST : loss 0.01364193 - f-score 0.8748 - acc 0.8748\n", + "2019-02-19 02:20:36,568 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:20:37,292 epoch 77 - iter 0/526 - loss 0.00156669\n", + "2019-02-19 02:21:15,702 epoch 77 - iter 52/526 - 
loss 0.00144137\n", + "2019-02-19 02:21:52,444 epoch 77 - iter 104/526 - loss 0.00145727\n", + "2019-02-19 02:22:31,773 epoch 77 - iter 156/526 - loss 0.00157244\n", + "2019-02-19 02:23:11,928 epoch 77 - iter 208/526 - loss 0.00171624\n", + "2019-02-19 02:23:55,161 epoch 77 - iter 260/526 - loss 0.00177478\n", + "2019-02-19 02:24:39,206 epoch 77 - iter 312/526 - loss 0.00173043\n", + "2019-02-19 02:25:21,429 epoch 77 - iter 364/526 - loss 0.00184676\n", + "2019-02-19 02:26:07,415 epoch 77 - iter 416/526 - loss 0.00182094\n", + "2019-02-19 02:26:51,424 epoch 77 - iter 468/526 - loss 0.00182330\n", + "2019-02-19 02:27:30,190 epoch 77 - iter 520/526 - loss 0.00188240\n", + "2019-02-19 02:27:33,871 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:27:33,872 EPOCH 77 done: loss 0.0019 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 02:28:10,543 DEV : loss 0.01020000 - f-score 0.9140 - acc 0.9140\n", + "2019-02-19 02:28:36,119 TEST : loss 0.01244381 - f-score 0.8910 - acc 0.8910\n", + "2019-02-19 02:28:46,987 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:28:47,869 epoch 78 - iter 0/526 - loss 0.00054872\n", + "2019-02-19 02:29:30,747 epoch 78 - iter 52/526 - loss 0.00141659\n", + "2019-02-19 02:30:15,700 epoch 78 - iter 104/526 - loss 0.00174331\n", + "2019-02-19 02:30:56,947 epoch 78 - iter 156/526 - loss 0.00177353\n", + "2019-02-19 02:31:39,842 epoch 78 - iter 208/526 - loss 0.00180384\n", + "2019-02-19 02:32:25,579 epoch 78 - iter 260/526 - loss 0.00185663\n", + "2019-02-19 02:33:06,241 epoch 78 - iter 312/526 - loss 0.00180144\n", + "2019-02-19 02:33:47,859 epoch 78 - iter 364/526 - loss 0.00187756\n", + "2019-02-19 02:34:32,693 epoch 78 - iter 416/526 - loss 0.00192514\n", + "2019-02-19 02:35:17,072 epoch 78 - iter 468/526 - loss 0.00190703\n", + "2019-02-19 02:36:01,395 epoch 78 - iter 520/526 - loss 0.00195062\n", + 
"2019-02-19 02:36:04,754 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:36:04,756 EPOCH 78 done: loss 0.0020 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 02:36:42,592 DEV : loss 0.00875567 - f-score 0.9200 - acc 0.9200\n", + "2019-02-19 02:37:08,871 TEST : loss 0.01336690 - f-score 0.8791 - acc 0.8791\n", + "2019-02-19 02:37:08,873 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:37:09,337 epoch 79 - iter 0/526 - loss 0.00065538\n", + "2019-02-19 02:37:51,948 epoch 79 - iter 52/526 - loss 0.00191990\n", + "2019-02-19 02:38:36,725 epoch 79 - iter 104/526 - loss 0.00194779\n", + "2019-02-19 02:39:19,145 epoch 79 - iter 156/526 - loss 0.00201094\n", + "2019-02-19 02:40:01,177 epoch 79 - iter 208/526 - loss 0.00193250\n", + "2019-02-19 02:40:42,325 epoch 79 - iter 260/526 - loss 0.00197127\n", + "2019-02-19 02:41:23,284 epoch 79 - iter 312/526 - loss 0.00197641\n", + "2019-02-19 02:42:17,528 epoch 79 - iter 364/526 - loss 0.00195634\n", + "2019-02-19 02:42:59,073 epoch 79 - iter 416/526 - loss 0.00201068\n", + "2019-02-19 02:43:39,041 epoch 79 - iter 468/526 - loss 0.00200842\n", + "2019-02-19 02:44:15,818 epoch 79 - iter 520/526 - loss 0.00198414\n", + "2019-02-19 02:44:19,621 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:44:19,622 EPOCH 79 done: loss 0.0020 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 02:44:58,237 DEV : loss 0.00981320 - f-score 0.9245 - acc 0.9245\n", + "2019-02-19 02:45:25,307 TEST : loss 0.01326628 - f-score 0.8881 - acc 0.8881\n", + "2019-02-19 02:45:25,312 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:45:25,981 epoch 80 - iter 0/526 - loss 0.00144069\n", + "2019-02-19 02:46:04,536 epoch 80 - iter 52/526 - loss 0.00199222\n", + "2019-02-19 02:46:45,747 
epoch 80 - iter 104/526 - loss 0.00210346\n", + "2019-02-19 02:47:25,520 epoch 80 - iter 156/526 - loss 0.00194081\n", + "2019-02-19 02:48:05,866 epoch 80 - iter 208/526 - loss 0.00187974\n", + "2019-02-19 02:48:45,502 epoch 80 - iter 260/526 - loss 0.00190591\n", + "2019-02-19 02:49:26,513 epoch 80 - iter 312/526 - loss 0.00187764\n", + "2019-02-19 02:50:10,527 epoch 80 - iter 364/526 - loss 0.00192389\n", + "2019-02-19 02:50:51,165 epoch 80 - iter 416/526 - loss 0.00189695\n", + "2019-02-19 02:51:35,254 epoch 80 - iter 468/526 - loss 0.00193701\n", + "2019-02-19 02:52:14,793 epoch 80 - iter 520/526 - loss 0.00192635\n", + "2019-02-19 02:52:19,188 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:52:19,189 EPOCH 80 done: loss 0.0019 - lr 0.1000 - bad epochs 2\n", + "2019-02-19 02:52:55,951 DEV : loss 0.00911485 - f-score 0.9250 - acc 0.9250\n", + "2019-02-19 02:53:20,886 TEST : loss 0.01340368 - f-score 0.8752 - acc 0.8752\n", + "2019-02-19 02:53:20,889 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 02:53:21,597 epoch 81 - iter 0/526 - loss 0.00439265\n", + "2019-02-19 02:53:57,933 epoch 81 - iter 52/526 - loss 0.00239608\n", + "2019-02-19 02:54:44,730 epoch 81 - iter 104/526 - loss 0.00199362\n", + "2019-02-19 02:55:36,891 epoch 81 - iter 156/526 - loss 0.00198345\n", + "2019-02-19 02:56:18,314 epoch 81 - iter 208/526 - loss 0.00207105\n", + "2019-02-19 02:57:03,542 epoch 81 - iter 260/526 - loss 0.00197111\n", + "2019-02-19 02:57:43,905 epoch 81 - iter 312/526 - loss 0.00186707\n", + "2019-02-19 02:58:23,235 epoch 81 - iter 364/526 - loss 0.00182501\n", + "2019-02-19 02:59:09,443 epoch 81 - iter 416/526 - loss 0.00183292\n", + "2019-02-19 02:59:49,669 epoch 81 - iter 468/526 - loss 0.00188667\n", + "2019-02-19 03:00:29,539 epoch 81 - iter 520/526 - loss 0.00191649\n", + "2019-02-19 03:00:32,704 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:00:32,705 EPOCH 81 done: loss 0.0019 - lr 0.1000 - bad epochs 3\n", + "2019-02-19 03:01:10,200 DEV : loss 0.01051898 - f-score 0.9030 - acc 0.9030\n", + "2019-02-19 03:01:36,105 TEST : loss 0.01146377 - f-score 0.8920 - acc 0.8920\n", + "2019-02-19 03:01:36,108 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:01:37,175 epoch 82 - iter 0/526 - loss 0.00541445\n", + "2019-02-19 03:02:14,652 epoch 82 - iter 52/526 - loss 0.00150638\n", + "2019-02-19 03:02:51,758 epoch 82 - iter 104/526 - loss 0.00167378\n", + "2019-02-19 03:03:32,773 epoch 82 - iter 156/526 - loss 0.00139234\n", + "2019-02-19 03:04:15,870 epoch 82 - iter 208/526 - loss 0.00145033\n", + "2019-02-19 03:05:02,197 epoch 82 - iter 260/526 - loss 0.00148591\n", + "2019-02-19 03:05:41,905 epoch 82 - iter 312/526 - loss 0.00152059\n", + "2019-02-19 03:06:29,345 epoch 82 - iter 364/526 - loss 0.00158479\n", + "2019-02-19 03:07:11,674 epoch 82 - iter 416/526 - loss 0.00161180\n", + "2019-02-19 03:07:53,200 epoch 82 - iter 468/526 - loss 0.00166763\n", + "2019-02-19 03:08:37,506 epoch 82 - iter 520/526 - loss 0.00170417\n", + "2019-02-19 03:08:41,610 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:08:41,612 EPOCH 82 done: loss 0.0017 - lr 0.1000 - bad epochs 4\n", + "2019-02-19 03:09:19,502 DEV : loss 0.00939283 - f-score 0.9185 - acc 0.9185\n", + "2019-02-19 03:09:44,831 TEST : loss 0.01314014 - f-score 0.8834 - acc 0.8834\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 03:09:55,742 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:09:57,170 epoch 83 - iter 0/526 - loss 0.00116846\n", + "2019-02-19 03:10:36,124 epoch 83 - iter 52/526 - 
loss 0.00159172\n", + "2019-02-19 03:11:13,588 epoch 83 - iter 104/526 - loss 0.00161017\n", + "2019-02-19 03:11:53,418 epoch 83 - iter 156/526 - loss 0.00155334\n", + "2019-02-19 03:12:41,752 epoch 83 - iter 208/526 - loss 0.00163101\n", + "2019-02-19 03:13:23,178 epoch 83 - iter 260/526 - loss 0.00162492\n", + "2019-02-19 03:14:02,174 epoch 83 - iter 312/526 - loss 0.00160849\n", + "2019-02-19 03:14:46,326 epoch 83 - iter 364/526 - loss 0.00157752\n", + "2019-02-19 03:15:30,124 epoch 83 - iter 416/526 - loss 0.00158247\n", + "2019-02-19 03:16:12,719 epoch 83 - iter 468/526 - loss 0.00167728\n", + "2019-02-19 03:16:54,016 epoch 83 - iter 520/526 - loss 0.00172712\n", + "2019-02-19 03:17:00,792 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:17:00,793 EPOCH 83 done: loss 0.0017 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 03:17:39,164 DEV : loss 0.01019812 - f-score 0.9180 - acc 0.9180\n", + "2019-02-19 03:18:06,079 TEST : loss 0.01362399 - f-score 0.8881 - acc 0.8881\n", + "2019-02-19 03:18:06,082 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:18:06,563 epoch 84 - iter 0/526 - loss 0.00104602\n", + "2019-02-19 03:18:45,351 epoch 84 - iter 52/526 - loss 0.00187649\n", + "2019-02-19 03:19:26,271 epoch 84 - iter 104/526 - loss 0.00157879\n", + "2019-02-19 03:20:15,276 epoch 84 - iter 156/526 - loss 0.00170571\n", + "2019-02-19 03:20:57,428 epoch 84 - iter 208/526 - loss 0.00172057\n", + "2019-02-19 03:21:41,594 epoch 84 - iter 260/526 - loss 0.00173967\n", + "2019-02-19 03:22:23,043 epoch 84 - iter 312/526 - loss 0.00169418\n", + "2019-02-19 03:23:06,685 epoch 84 - iter 364/526 - loss 0.00167364\n", + "2019-02-19 03:23:50,703 epoch 84 - iter 416/526 - loss 0.00166478\n", + "2019-02-19 03:24:32,658 epoch 84 - iter 468/526 - loss 0.00166701\n", + "2019-02-19 03:25:13,996 epoch 84 - iter 520/526 - loss 0.00166984\n", + 
"2019-02-19 03:25:18,524 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:25:18,525 EPOCH 84 done: loss 0.0017 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 03:25:57,558 DEV : loss 0.01050610 - f-score 0.9210 - acc 0.9210\n", + "2019-02-19 03:26:24,133 TEST : loss 0.01489008 - f-score 0.8867 - acc 0.8867\n", + "2019-02-19 03:26:35,003 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:26:37,771 epoch 85 - iter 0/526 - loss 0.00104147\n", + "2019-02-19 03:27:19,435 epoch 85 - iter 52/526 - loss 0.00169354\n", + "2019-02-19 03:28:02,000 epoch 85 - iter 104/526 - loss 0.00167812\n", + "2019-02-19 03:28:44,709 epoch 85 - iter 156/526 - loss 0.00160129\n", + "2019-02-19 03:29:26,565 epoch 85 - iter 208/526 - loss 0.00161251\n", + "2019-02-19 03:30:05,279 epoch 85 - iter 260/526 - loss 0.00154626\n", + "2019-02-19 03:30:43,622 epoch 85 - iter 312/526 - loss 0.00160706\n", + "2019-02-19 03:31:25,456 epoch 85 - iter 364/526 - loss 0.00164673\n", + "2019-02-19 03:32:08,277 epoch 85 - iter 416/526 - loss 0.00158821\n", + "2019-02-19 03:32:47,972 epoch 85 - iter 468/526 - loss 0.00161365\n", + "2019-02-19 03:33:32,867 epoch 85 - iter 520/526 - loss 0.00158964\n", + "2019-02-19 03:33:36,072 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:33:36,073 EPOCH 85 done: loss 0.0016 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 03:34:12,160 DEV : loss 0.01179647 - f-score 0.9245 - acc 0.9245\n", + "2019-02-19 03:34:38,269 TEST : loss 0.01552512 - f-score 0.8905 - acc 0.8905\n", + "2019-02-19 03:34:49,203 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:34:49,779 epoch 86 - iter 0/526 - loss 0.00014578\n", + "2019-02-19 03:35:31,308 epoch 86 - iter 52/526 - loss 0.00181892\n", + "2019-02-19 03:36:11,743 
epoch 86 - iter 104/526 - loss 0.00172629\n", + "2019-02-19 03:36:47,593 epoch 86 - iter 156/526 - loss 0.00177134\n", + "2019-02-19 03:37:25,249 epoch 86 - iter 208/526 - loss 0.00186702\n", + "2019-02-19 03:38:06,991 epoch 86 - iter 260/526 - loss 0.00182549\n", + "2019-02-19 03:38:47,202 epoch 86 - iter 312/526 - loss 0.00179496\n", + "2019-02-19 03:39:27,749 epoch 86 - iter 364/526 - loss 0.00180684\n", + "2019-02-19 03:40:09,161 epoch 86 - iter 416/526 - loss 0.00183078\n", + "2019-02-19 03:40:51,981 epoch 86 - iter 468/526 - loss 0.00184957\n", + "2019-02-19 03:41:34,842 epoch 86 - iter 520/526 - loss 0.00182854\n", + "2019-02-19 03:41:38,207 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:41:38,209 EPOCH 86 done: loss 0.0018 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 03:42:14,387 DEV : loss 0.01291922 - f-score 0.9095 - acc 0.9095\n", + "2019-02-19 03:42:40,022 TEST : loss 0.02182853 - f-score 0.8566 - acc 0.8566\n", + "2019-02-19 03:42:40,025 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:42:40,657 epoch 87 - iter 0/526 - loss 0.00238495\n", + "2019-02-19 03:43:21,317 epoch 87 - iter 52/526 - loss 0.00213423\n", + "2019-02-19 03:44:01,515 epoch 87 - iter 104/526 - loss 0.00176320\n", + "2019-02-19 03:44:44,551 epoch 87 - iter 156/526 - loss 0.00187373\n", + "2019-02-19 03:45:25,541 epoch 87 - iter 208/526 - loss 0.00187932\n", + "2019-02-19 03:46:12,422 epoch 87 - iter 260/526 - loss 0.00174580\n", + "2019-02-19 03:46:55,052 epoch 87 - iter 312/526 - loss 0.00164460\n", + "2019-02-19 03:47:34,683 epoch 87 - iter 364/526 - loss 0.00167436\n", + "2019-02-19 03:48:15,683 epoch 87 - iter 416/526 - loss 0.00165913\n", + "2019-02-19 03:49:00,692 epoch 87 - iter 468/526 - loss 0.00161779\n", + "2019-02-19 03:49:38,162 epoch 87 - iter 520/526 - loss 0.00167926\n", + "2019-02-19 03:49:41,280 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:49:41,281 EPOCH 87 done: loss 0.0017 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 03:50:19,035 DEV : loss 0.01156142 - f-score 0.9100 - acc 0.9100\n", + "2019-02-19 03:50:53,896 TEST : loss 0.01318137 - f-score 0.8977 - acc 0.8977\n", + "2019-02-19 03:50:53,899 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:50:54,694 epoch 88 - iter 0/526 - loss 0.00888010\n", + "2019-02-19 03:51:32,643 epoch 88 - iter 52/526 - loss 0.00179779\n", + "2019-02-19 03:52:14,288 epoch 88 - iter 104/526 - loss 0.00178959\n", + "2019-02-19 03:53:07,367 epoch 88 - iter 156/526 - loss 0.00158125\n", + "2019-02-19 03:53:47,027 epoch 88 - iter 208/526 - loss 0.00149774\n", + "2019-02-19 03:54:27,961 epoch 88 - iter 260/526 - loss 0.00156698\n", + "2019-02-19 03:55:06,177 epoch 88 - iter 312/526 - loss 0.00158517\n", + "2019-02-19 03:55:48,056 epoch 88 - iter 364/526 - loss 0.00157284\n", + "2019-02-19 03:56:31,494 epoch 88 - iter 416/526 - loss 0.00161180\n", + "2019-02-19 03:57:14,026 epoch 88 - iter 468/526 - loss 0.00159980\n", + "2019-02-19 03:57:54,676 epoch 88 - iter 520/526 - loss 0.00162030\n", + "2019-02-19 03:57:58,394 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:57:58,395 EPOCH 88 done: loss 0.0016 - lr 0.1000 - bad epochs 2\n", + "2019-02-19 03:58:37,099 DEV : loss 0.00950958 - f-score 0.9180 - acc 0.9180\n", + "2019-02-19 03:59:09,304 TEST : loss 0.01486431 - f-score 0.8647 - acc 0.8647\n", + "2019-02-19 03:59:09,306 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 03:59:10,382 epoch 89 - iter 0/526 - loss 0.00106604\n", + "2019-02-19 03:59:53,107 epoch 89 - iter 52/526 - loss 0.00143349\n", + "2019-02-19 04:00:33,169 epoch 89 - iter 104/526 
- loss 0.00127343\n", + "2019-02-19 04:01:12,532 epoch 89 - iter 156/526 - loss 0.00132347\n", + "2019-02-19 04:01:48,752 epoch 89 - iter 208/526 - loss 0.00141182\n", + "2019-02-19 04:02:25,892 epoch 89 - iter 260/526 - loss 0.00144000\n", + "2019-02-19 04:03:07,553 epoch 89 - iter 312/526 - loss 0.00141707\n", + "2019-02-19 04:03:48,632 epoch 89 - iter 364/526 - loss 0.00159705\n", + "2019-02-19 04:04:30,010 epoch 89 - iter 416/526 - loss 0.00162946\n", + "2019-02-19 04:05:11,681 epoch 89 - iter 468/526 - loss 0.00169225\n", + "2019-02-19 04:05:52,479 epoch 89 - iter 520/526 - loss 0.00166944\n", + "2019-02-19 04:05:56,285 ----------------------------------------------------------------------------------------------------\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 04:05:56,286 EPOCH 89 done: loss 0.0017 - lr 0.1000 - bad epochs 3\n", + "2019-02-19 04:06:32,360 DEV : loss 0.00939411 - f-score 0.9235 - acc 0.9235\n", + "2019-02-19 04:06:58,131 TEST : loss 0.01308209 - f-score 0.8838 - acc 0.8838\n", + "2019-02-19 04:06:58,133 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:06:58,860 epoch 90 - iter 0/526 - loss 0.00101154\n", + "2019-02-19 04:07:37,443 epoch 90 - iter 52/526 - loss 0.00089107\n", + "2019-02-19 04:08:16,461 epoch 90 - iter 104/526 - loss 0.00139649\n", + "2019-02-19 04:08:54,228 epoch 90 - iter 156/526 - loss 0.00175853\n", + "2019-02-19 04:09:32,488 epoch 90 - iter 208/526 - loss 0.00172246\n", + "2019-02-19 04:10:12,980 epoch 90 - iter 260/526 - loss 0.00189268\n", + "2019-02-19 04:10:53,641 epoch 90 - iter 312/526 - loss 0.00188720\n", + "2019-02-19 04:11:30,056 epoch 90 - iter 364/526 - loss 0.00182692\n", + "2019-02-19 04:12:16,140 epoch 90 - iter 416/526 - loss 0.00177614\n", + "2019-02-19 04:12:55,559 epoch 90 - iter 468/526 - loss 0.00172816\n", + "2019-02-19 04:13:35,062 epoch 90 - iter 520/526 - loss 0.00173893\n", + 
"2019-02-19 04:13:38,367 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:13:38,368 EPOCH 90 done: loss 0.0017 - lr 0.1000 - bad epochs 4\n", + "2019-02-19 04:14:14,133 DEV : loss 0.01047690 - f-score 0.9150 - acc 0.9150\n", + "2019-02-19 04:14:38,997 TEST : loss 0.01398433 - f-score 0.8815 - acc 0.8815\n", + "2019-02-19 04:14:39,000 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:14:39,771 epoch 91 - iter 0/526 - loss 0.00077369\n", + "2019-02-19 04:15:20,017 epoch 91 - iter 52/526 - loss 0.00159348\n", + "2019-02-19 04:16:06,778 epoch 91 - iter 104/526 - loss 0.00126205\n", + "2019-02-19 04:16:51,666 epoch 91 - iter 156/526 - loss 0.00143544\n", + "2019-02-19 04:17:30,571 epoch 91 - iter 208/526 - loss 0.00146865\n", + "2019-02-19 04:18:11,681 epoch 91 - iter 260/526 - loss 0.00139851\n", + "2019-02-19 04:18:50,777 epoch 91 - iter 312/526 - loss 0.00143424\n", + "2019-02-19 04:19:35,239 epoch 91 - iter 364/526 - loss 0.00143754\n", + "2019-02-19 04:20:29,443 epoch 91 - iter 416/526 - loss 0.00144322\n", + "2019-02-19 04:21:08,777 epoch 91 - iter 468/526 - loss 0.00142449\n", + "2019-02-19 04:21:49,426 epoch 91 - iter 520/526 - loss 0.00147375\n", + "2019-02-19 04:21:53,225 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:21:53,227 EPOCH 91 done: loss 0.0015 - lr 0.1000 - bad epochs 5\n", + "2019-02-19 04:22:42,848 DEV : loss 0.01142728 - f-score 0.9240 - acc 0.9240\n", + "2019-02-19 04:23:09,283 TEST : loss 0.01610915 - f-score 0.8877 - acc 0.8877\n", + "2019-02-19 04:23:20,255 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:23:21,186 epoch 92 - iter 0/526 - loss 0.00007011\n", + "2019-02-19 04:24:01,872 epoch 92 - iter 52/526 - loss 0.00164318\n", + "2019-02-19 04:24:45,352 
epoch 92 - iter 104/526 - loss 0.00154162\n", + "2019-02-19 04:25:24,542 epoch 92 - iter 156/526 - loss 0.00141932\n", + "2019-02-19 04:26:05,209 epoch 92 - iter 208/526 - loss 0.00136995\n", + "2019-02-19 04:26:44,670 epoch 92 - iter 260/526 - loss 0.00138729\n", + "2019-02-19 04:27:25,123 epoch 92 - iter 312/526 - loss 0.00134203\n", + "2019-02-19 04:28:11,010 epoch 92 - iter 364/526 - loss 0.00135643\n", + "2019-02-19 04:28:50,742 epoch 92 - iter 416/526 - loss 0.00142221\n", + "2019-02-19 04:29:29,970 epoch 92 - iter 468/526 - loss 0.00138912\n", + "2019-02-19 04:30:14,129 epoch 92 - iter 520/526 - loss 0.00139426\n", + "2019-02-19 04:30:18,673 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:30:18,674 EPOCH 92 done: loss 0.0014 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 04:30:57,160 DEV : loss 0.01147311 - f-score 0.9180 - acc 0.9180\n", + "2019-02-19 04:31:23,518 TEST : loss 0.01745269 - f-score 0.8705 - acc 0.8705\n", + "2019-02-19 04:31:34,343 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:31:35,045 epoch 93 - iter 0/526 - loss 0.00333420\n", + "2019-02-19 04:32:15,211 epoch 93 - iter 52/526 - loss 0.00144450\n", + "2019-02-19 04:33:08,536 epoch 93 - iter 104/526 - loss 0.00124302\n", + "2019-02-19 04:33:45,927 epoch 93 - iter 156/526 - loss 0.00123781\n", + "2019-02-19 04:34:23,005 epoch 93 - iter 208/526 - loss 0.00120892\n", + "2019-02-19 04:35:00,646 epoch 93 - iter 260/526 - loss 0.00128353\n", + "2019-02-19 04:35:42,418 epoch 93 - iter 312/526 - loss 0.00128915\n", + "2019-02-19 04:36:26,053 epoch 93 - iter 364/526 - loss 0.00136641\n", + "2019-02-19 04:37:05,173 epoch 93 - iter 416/526 - loss 0.00137863\n", + "2019-02-19 04:37:57,451 epoch 93 - iter 468/526 - loss 0.00144463\n", + "2019-02-19 04:38:37,082 epoch 93 - iter 520/526 - loss 0.00155321\n", + "2019-02-19 04:38:40,625 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:38:40,626 EPOCH 93 done: loss 0.0016 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 04:39:18,039 DEV : loss 0.01175705 - f-score 0.9220 - acc 0.9220\n", + "2019-02-19 04:39:44,095 TEST : loss 0.01827965 - f-score 0.8795 - acc 0.8795\n", + "2019-02-19 04:39:44,097 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:39:44,820 epoch 94 - iter 0/526 - loss 0.00773266\n", + "2019-02-19 04:40:26,093 epoch 94 - iter 52/526 - loss 0.00121886\n", + "2019-02-19 04:41:07,960 epoch 94 - iter 104/526 - loss 0.00127905\n", + "2019-02-19 04:42:03,489 epoch 94 - iter 156/526 - loss 0.00122680\n", + "2019-02-19 04:42:46,403 epoch 94 - iter 208/526 - loss 0.00129118\n", + "2019-02-19 04:43:31,433 epoch 94 - iter 260/526 - loss 0.00130237\n", + "2019-02-19 04:44:10,246 epoch 94 - iter 312/526 - loss 0.00127384\n", + "2019-02-19 04:44:51,962 epoch 94 - iter 364/526 - loss 0.00124976\n", + "2019-02-19 04:45:33,105 epoch 94 - iter 416/526 - loss 0.00127324\n", + "2019-02-19 04:46:13,533 epoch 94 - iter 468/526 - loss 0.00128987\n", + "2019-02-19 04:46:55,169 epoch 94 - iter 520/526 - loss 0.00133658\n", + "2019-02-19 04:46:58,687 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:46:58,688 EPOCH 94 done: loss 0.0013 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 04:47:35,065 DEV : loss 0.01234767 - f-score 0.9155 - acc 0.9155\n", + "2019-02-19 04:48:00,431 TEST : loss 0.01424169 - f-score 0.8944 - acc 0.8944\n", + "2019-02-19 04:48:11,380 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:48:12,465 epoch 95 - iter 0/526 - loss 0.00014443\n", + "2019-02-19 04:48:57,205 epoch 95 - iter 52/526 - loss 0.00140546\n", + "2019-02-19 04:49:39,666 epoch 95 - iter 104/526 
- loss 0.00114873\n", + "2019-02-19 04:50:21,825 epoch 95 - iter 156/526 - loss 0.00112524\n", + "2019-02-19 04:50:59,568 epoch 95 - iter 208/526 - loss 0.00119036\n", + "2019-02-19 04:51:40,341 epoch 95 - iter 260/526 - loss 0.00125732\n", + "2019-02-19 04:52:20,495 epoch 95 - iter 312/526 - loss 0.00127443\n", + "2019-02-19 04:53:00,700 epoch 95 - iter 364/526 - loss 0.00127471\n", + "2019-02-19 04:53:38,960 epoch 95 - iter 416/526 - loss 0.00127094\n", + "2019-02-19 04:54:16,842 epoch 95 - iter 468/526 - loss 0.00129768\n", + "2019-02-19 04:54:59,030 epoch 95 - iter 520/526 - loss 0.00135680\n", + "2019-02-19 04:55:02,621 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:55:02,622 EPOCH 95 done: loss 0.0014 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 04:55:38,650 DEV : loss 0.01068178 - f-score 0.9140 - acc 0.9140\n", + "2019-02-19 04:56:03,485 TEST : loss 0.01493327 - f-score 0.8776 - acc 0.8776\n", + "2019-02-19 04:56:03,488 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 04:56:04,335 epoch 96 - iter 0/526 - loss 0.00018781\n", + "2019-02-19 04:56:42,224 epoch 96 - iter 52/526 - loss 0.00149686\n", + "2019-02-19 04:57:22,582 epoch 96 - iter 104/526 - loss 0.00132458\n", + "2019-02-19 04:58:02,760 epoch 96 - iter 156/526 - loss 0.00126279\n", + "2019-02-19 04:58:42,049 epoch 96 - iter 208/526 - loss 0.00129965\n", + "2019-02-19 04:59:21,499 epoch 96 - iter 260/526 - loss 0.00128112\n", + "2019-02-19 05:00:03,057 epoch 96 - iter 312/526 - loss 0.00126635\n", + "2019-02-19 05:00:40,537 epoch 96 - iter 364/526 - loss 0.00128816\n", + "2019-02-19 05:01:18,138 epoch 96 - iter 416/526 - loss 0.00131574\n", + "2019-02-19 05:01:59,089 epoch 96 - iter 468/526 - loss 0.00130132\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 05:02:37,096 epoch 96 - iter 520/526 - loss 0.00130853\n", + 
"2019-02-19 05:02:40,620 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:02:40,621 EPOCH 96 done: loss 0.0013 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 05:03:18,696 DEV : loss 0.01226297 - f-score 0.9145 - acc 0.9145\n", + "2019-02-19 05:03:44,963 TEST : loss 0.01488450 - f-score 0.8853 - acc 0.8853\n", + "2019-02-19 05:03:55,820 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:03:56,443 epoch 97 - iter 0/526 - loss 0.00024264\n", + "2019-02-19 05:04:36,270 epoch 97 - iter 52/526 - loss 0.00130788\n", + "2019-02-19 05:05:14,296 epoch 97 - iter 104/526 - loss 0.00145916\n", + "2019-02-19 05:05:53,124 epoch 97 - iter 156/526 - loss 0.00146267\n", + "2019-02-19 05:06:35,695 epoch 97 - iter 208/526 - loss 0.00135054\n", + "2019-02-19 05:07:17,866 epoch 97 - iter 260/526 - loss 0.00140619\n", + "2019-02-19 05:07:59,147 epoch 97 - iter 312/526 - loss 0.00134640\n", + "2019-02-19 05:08:42,354 epoch 97 - iter 364/526 - loss 0.00136702\n", + "2019-02-19 05:09:21,560 epoch 97 - iter 416/526 - loss 0.00139266\n", + "2019-02-19 05:10:01,792 epoch 97 - iter 468/526 - loss 0.00140579\n", + "2019-02-19 05:10:44,270 epoch 97 - iter 520/526 - loss 0.00139031\n", + "2019-02-19 05:10:48,288 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:10:48,289 EPOCH 97 done: loss 0.0014 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 05:11:25,170 DEV : loss 0.01116125 - f-score 0.9180 - acc 0.9180\n", + "2019-02-19 05:11:50,998 TEST : loss 0.01560584 - f-score 0.8800 - acc 0.8800\n", + "2019-02-19 05:11:51,000 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:11:51,754 epoch 98 - iter 0/526 - loss 0.00012022\n", + "2019-02-19 05:12:32,908 epoch 98 - iter 52/526 - loss 0.00103170\n", + "2019-02-19 05:13:10,501 
epoch 98 - iter 104/526 - loss 0.00087034\n", + "2019-02-19 05:13:53,116 epoch 98 - iter 156/526 - loss 0.00104750\n", + "2019-02-19 05:14:31,318 epoch 98 - iter 208/526 - loss 0.00103992\n", + "2019-02-19 05:15:13,141 epoch 98 - iter 260/526 - loss 0.00109514\n", + "2019-02-19 05:15:54,644 epoch 98 - iter 312/526 - loss 0.00109452\n", + "2019-02-19 05:16:35,835 epoch 98 - iter 364/526 - loss 0.00110683\n", + "2019-02-19 05:17:14,223 epoch 98 - iter 416/526 - loss 0.00108642\n", + "2019-02-19 05:17:58,404 epoch 98 - iter 468/526 - loss 0.00111691\n", + "2019-02-19 05:18:43,695 epoch 98 - iter 520/526 - loss 0.00114827\n", + "2019-02-19 05:18:47,518 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:18:47,520 EPOCH 98 done: loss 0.0012 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 05:19:26,272 DEV : loss 0.01133704 - f-score 0.9215 - acc 0.9215\n", + "2019-02-19 05:19:52,518 TEST : loss 0.01621639 - f-score 0.8781 - acc 0.8781\n", + "2019-02-19 05:20:03,429 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:20:05,254 epoch 99 - iter 0/526 - loss 0.00053865\n", + "2019-02-19 05:20:44,830 epoch 99 - iter 52/526 - loss 0.00109932\n", + "2019-02-19 05:21:25,549 epoch 99 - iter 104/526 - loss 0.00138798\n", + "2019-02-19 05:22:12,139 epoch 99 - iter 156/526 - loss 0.00128947\n", + "2019-02-19 05:22:51,781 epoch 99 - iter 208/526 - loss 0.00133365\n", + "2019-02-19 05:23:29,632 epoch 99 - iter 260/526 - loss 0.00139241\n", + "2019-02-19 05:24:08,193 epoch 99 - iter 312/526 - loss 0.00135227\n", + "2019-02-19 05:24:46,940 epoch 99 - iter 364/526 - loss 0.00133667\n", + "2019-02-19 05:25:26,571 epoch 99 - iter 416/526 - loss 0.00135636\n", + "2019-02-19 05:26:10,507 epoch 99 - iter 468/526 - loss 0.00136814\n", + "2019-02-19 05:26:58,024 epoch 99 - iter 520/526 - loss 0.00135109\n", + "2019-02-19 05:27:01,500 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:27:01,501 EPOCH 99 done: loss 0.0014 - lr 0.1000 - bad epochs 0\n", + "2019-02-19 05:27:38,507 DEV : loss 0.01141116 - f-score 0.9200 - acc 0.9200\n", + "2019-02-19 05:28:03,395 TEST : loss 0.01647193 - f-score 0.8805 - acc 0.8805\n", + "2019-02-19 05:28:03,399 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:28:04,242 epoch 100 - iter 0/526 - loss 0.00205240\n", + "2019-02-19 05:28:43,705 epoch 100 - iter 52/526 - loss 0.00142875\n", + "2019-02-19 05:29:25,255 epoch 100 - iter 104/526 - loss 0.00141394\n", + "2019-02-19 05:30:09,541 epoch 100 - iter 156/526 - loss 0.00135374\n", + "2019-02-19 05:30:47,861 epoch 100 - iter 208/526 - loss 0.00130048\n", + "2019-02-19 05:31:30,009 epoch 100 - iter 260/526 - loss 0.00125319\n", + "2019-02-19 05:32:07,358 epoch 100 - iter 312/526 - loss 0.00127834\n", + "2019-02-19 05:32:45,013 epoch 100 - iter 364/526 - loss 0.00122238\n", + "2019-02-19 05:33:22,192 epoch 100 - iter 416/526 - loss 0.00123365\n", + "2019-02-19 05:34:02,515 epoch 100 - iter 468/526 - loss 0.00119514\n", + "2019-02-19 05:34:42,764 epoch 100 - iter 520/526 - loss 0.00118177\n", + "2019-02-19 05:34:47,164 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:34:47,166 EPOCH 100 done: loss 0.0012 - lr 0.1000 - bad epochs 1\n", + "2019-02-19 05:35:25,628 DEV : loss 0.01209000 - f-score 0.9285 - acc 0.9285\n", + "2019-02-19 05:35:51,712 TEST : loss 0.01760402 - f-score 0.8824 - acc 0.8824\n", + "2019-02-19 05:35:51,714 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:35:52,501 epoch 101 - iter 0/526 - loss 0.00106431\n", + "2019-02-19 05:36:31,030 epoch 101 - iter 52/526 - loss 0.00123354\n", + "2019-02-19 05:37:18,043 epoch 101 
- iter 104/526 - loss 0.00138914\n", + "2019-02-19 05:37:55,530 epoch 101 - iter 156/526 - loss 0.00134113\n", + "2019-02-19 05:38:37,605 epoch 101 - iter 208/526 - loss 0.00140518\n", + "2019-02-19 05:39:19,489 epoch 101 - iter 260/526 - loss 0.00137156\n", + "2019-02-19 05:40:01,490 epoch 101 - iter 312/526 - loss 0.00133900\n", + "2019-02-19 05:40:44,527 epoch 101 - iter 364/526 - loss 0.00133006\n", + "2019-02-19 05:41:32,385 epoch 101 - iter 416/526 - loss 0.00127373\n", + "2019-02-19 05:42:12,314 epoch 101 - iter 468/526 - loss 0.00121552\n", + "2019-02-19 05:42:53,265 epoch 101 - iter 520/526 - loss 0.00125339\n", + "2019-02-19 05:42:56,782 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:42:56,783 EPOCH 101 done: loss 0.0012 - lr 0.1000 - bad epochs 2\n", + "2019-02-19 05:43:32,009 DEV : loss 0.01149580 - f-score 0.9205 - acc 0.9205\n", + "2019-02-19 05:43:57,120 TEST : loss 0.01478640 - f-score 0.8867 - acc 0.8867\n", + "2019-02-19 05:43:57,122 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:43:57,792 epoch 102 - iter 0/526 - loss 0.00034308\n", + "2019-02-19 05:44:47,766 epoch 102 - iter 52/526 - loss 0.00111355\n", + "2019-02-19 05:45:32,037 epoch 102 - iter 104/526 - loss 0.00115448\n", + "2019-02-19 05:46:18,590 epoch 102 - iter 156/526 - loss 0.00119224\n", + "2019-02-19 05:46:56,421 epoch 102 - iter 208/526 - loss 0.00118233\n", + "2019-02-19 05:47:35,766 epoch 102 - iter 260/526 - loss 0.00121846\n", + "2019-02-19 05:48:21,188 epoch 102 - iter 312/526 - loss 0.00127382\n", + "2019-02-19 05:48:59,950 epoch 102 - iter 364/526 - loss 0.00126384\n", + "2019-02-19 05:49:42,131 epoch 102 - iter 416/526 - loss 0.00125549\n", + "2019-02-19 05:50:25,036 epoch 102 - iter 468/526 - loss 0.00123138\n", + "2019-02-19 05:51:08,328 epoch 102 - iter 520/526 - loss 0.00125433\n", + "2019-02-19 05:51:12,972 
----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:51:12,974 EPOCH 102 done: loss 0.0012 - lr 0.1000 - bad epochs 3\n", + "2019-02-19 05:51:49,285 DEV : loss 0.01211794 - f-score 0.9250 - acc 0.9250\n", + "2019-02-19 05:52:14,459 TEST : loss 0.01766142 - f-score 0.8824 - acc 0.8824\n", + "2019-02-19 05:52:14,461 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:52:15,265 epoch 103 - iter 0/526 - loss 0.00020129\n", + "2019-02-19 05:52:54,278 epoch 103 - iter 52/526 - loss 0.00117241\n", + "2019-02-19 05:53:40,566 epoch 103 - iter 104/526 - loss 0.00129302\n", + "2019-02-19 05:54:21,014 epoch 103 - iter 156/526 - loss 0.00119402\n", + "2019-02-19 05:55:07,676 epoch 103 - iter 208/526 - loss 0.00129898\n", + "2019-02-19 05:55:48,013 epoch 103 - iter 260/526 - loss 0.00130149\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-02-19 05:56:29,273 epoch 103 - iter 312/526 - loss 0.00130189\n", + "2019-02-19 05:57:11,297 epoch 103 - iter 364/526 - loss 0.00133018\n", + "2019-02-19 05:57:49,646 epoch 103 - iter 416/526 - loss 0.00131048\n", + "2019-02-19 05:58:30,983 epoch 103 - iter 468/526 - loss 0.00130456\n", + "2019-02-19 05:59:13,014 epoch 103 - iter 520/526 - loss 0.00127761\n", + "2019-02-19 05:59:16,259 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 05:59:16,260 EPOCH 103 done: loss 0.0013 - lr 0.1000 - bad epochs 4\n", + "2019-02-19 05:59:52,479 DEV : loss 0.01174637 - f-score 0.9240 - acc 0.9240\n", + "2019-02-19 06:00:17,984 TEST : loss 0.01570701 - f-score 0.8824 - acc 0.8824\n", + "2019-02-19 06:00:17,987 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:00:18,988 epoch 104 - iter 0/526 - loss 0.00028872\n", + "2019-02-19 06:01:00,303 epoch 104 - 
iter 52/526 - loss 0.00128675\n", + "2019-02-19 06:01:40,773 epoch 104 - iter 104/526 - loss 0.00129726\n", + "2019-02-19 06:02:23,467 epoch 104 - iter 156/526 - loss 0.00116072\n", + "2019-02-19 06:03:01,850 epoch 104 - iter 208/526 - loss 0.00117532\n", + "2019-02-19 06:03:41,140 epoch 104 - iter 260/526 - loss 0.00118035\n", + "2019-02-19 06:04:23,657 epoch 104 - iter 312/526 - loss 0.00123913\n", + "2019-02-19 06:05:09,079 epoch 104 - iter 364/526 - loss 0.00119165\n", + "2019-02-19 06:05:52,089 epoch 104 - iter 416/526 - loss 0.00120042\n", + "2019-02-19 06:06:29,401 epoch 104 - iter 468/526 - loss 0.00124895\n", + "2019-02-19 06:07:10,132 epoch 104 - iter 520/526 - loss 0.00127027\n", + "2019-02-19 06:07:13,510 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:07:13,512 EPOCH 104 done: loss 0.0013 - lr 0.1000 - bad epochs 5\n", + "2019-02-19 06:07:49,372 DEV : loss 0.01213129 - f-score 0.9100 - acc 0.9100\n", + "2019-02-19 06:08:13,798 TEST : loss 0.02008677 - f-score 0.8485 - acc 0.8485\n", + "Epoch 103: reducing learning rate of group 0 to 5.0000e-02.\n", + "2019-02-19 06:08:13,802 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:08:14,471 epoch 105 - iter 0/526 - loss 0.00048894\n", + "2019-02-19 06:08:54,567 epoch 105 - iter 52/526 - loss 0.00089895\n", + "2019-02-19 06:09:30,302 epoch 105 - iter 104/526 - loss 0.00094203\n", + "2019-02-19 06:10:10,807 epoch 105 - iter 156/526 - loss 0.00086284\n", + "2019-02-19 06:10:49,854 epoch 105 - iter 208/526 - loss 0.00085964\n", + "2019-02-19 06:11:28,507 epoch 105 - iter 260/526 - loss 0.00080848\n", + "2019-02-19 06:12:08,794 epoch 105 - iter 312/526 - loss 0.00086415\n", + "2019-02-19 06:12:53,583 epoch 105 - iter 364/526 - loss 0.00088859\n", + "2019-02-19 06:13:34,755 epoch 105 - iter 416/526 - loss 0.00090857\n", + "2019-02-19 06:14:16,640 epoch 105 - iter 468/526 
- loss 0.00090407\n", + "2019-02-19 06:15:00,598 epoch 105 - iter 520/526 - loss 0.00088821\n", + "2019-02-19 06:15:05,196 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:15:05,198 EPOCH 105 done: loss 0.0009 - lr 0.0500 - bad epochs 0\n", + "2019-02-19 06:15:58,421 DEV : loss 0.01244135 - f-score 0.9190 - acc 0.9190\n", + "2019-02-19 06:16:34,003 TEST : loss 0.01626293 - f-score 0.8862 - acc 0.8862\n", + "2019-02-19 06:16:45,196 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:16:45,951 epoch 106 - iter 0/526 - loss 0.00030530\n", + "2019-02-19 06:17:27,294 epoch 106 - iter 52/526 - loss 0.00056293\n", + "2019-02-19 06:18:11,224 epoch 106 - iter 104/526 - loss 0.00061212\n", + "2019-02-19 06:18:50,629 epoch 106 - iter 156/526 - loss 0.00069673\n", + "2019-02-19 06:19:33,765 epoch 106 - iter 208/526 - loss 0.00075924\n", + "2019-02-19 06:20:14,245 epoch 106 - iter 260/526 - loss 0.00076106\n", + "2019-02-19 06:20:52,190 epoch 106 - iter 312/526 - loss 0.00077286\n", + "2019-02-19 06:21:32,268 epoch 106 - iter 364/526 - loss 0.00074958\n", + "2019-02-19 06:22:09,558 epoch 106 - iter 416/526 - loss 0.00081282\n", + "2019-02-19 06:22:48,818 epoch 106 - iter 468/526 - loss 0.00083233\n", + "2019-02-19 06:23:31,557 epoch 106 - iter 520/526 - loss 0.00082965\n", + "2019-02-19 06:23:35,328 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:23:35,329 EPOCH 106 done: loss 0.0008 - lr 0.0500 - bad epochs 0\n", + "2019-02-19 06:24:13,622 DEV : loss 0.01348019 - f-score 0.9180 - acc 0.9180\n", + "2019-02-19 06:24:39,040 TEST : loss 0.01750593 - f-score 0.8791 - acc 0.8791\n", + "2019-02-19 06:24:49,961 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:24:51,260 epoch 107 - iter 0/526 - loss 
0.00168006\n", + "2019-02-19 06:25:33,840 epoch 107 - iter 52/526 - loss 0.00066215\n", + "2019-02-19 06:26:13,859 epoch 107 - iter 104/526 - loss 0.00066321\n", + "2019-02-19 06:26:52,051 epoch 107 - iter 156/526 - loss 0.00069134\n", + "2019-02-19 06:27:36,375 epoch 107 - iter 208/526 - loss 0.00065783\n", + "2019-02-19 06:28:14,066 epoch 107 - iter 260/526 - loss 0.00063577\n", + "2019-02-19 06:28:56,302 epoch 107 - iter 312/526 - loss 0.00065161\n", + "2019-02-19 06:29:34,917 epoch 107 - iter 364/526 - loss 0.00063521\n", + "2019-02-19 06:30:11,756 epoch 107 - iter 416/526 - loss 0.00062486\n", + "2019-02-19 06:30:50,263 epoch 107 - iter 468/526 - loss 0.00060772\n", + "2019-02-19 06:31:33,289 epoch 107 - iter 520/526 - loss 0.00062081\n", + "2019-02-19 06:31:35,950 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:31:35,951 EPOCH 107 done: loss 0.0006 - lr 0.0500 - bad epochs 0\n", + "2019-02-19 06:32:11,180 DEV : loss 0.01386657 - f-score 0.9195 - acc 0.9195\n", + "2019-02-19 06:32:35,566 TEST : loss 0.01769999 - f-score 0.8848 - acc 0.8848\n", + "2019-02-19 06:32:46,461 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:32:47,097 epoch 108 - iter 0/526 - loss 0.00015158\n", + "2019-02-19 06:33:24,171 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:33:24,173 Exiting from training early.\n", + "2019-02-19 06:33:24,174 Saving model ...\n", + "2019-02-19 06:33:34,901 Done.\n", + "2019-02-19 06:33:34,902 ----------------------------------------------------------------------------------------------------\n", + "2019-02-19 06:33:34,903 Testing using best model ...\n", + "2019-02-19 06:34:03,015 MICRO_AVG: acc 0.8848 - f1-score 0.8848\n", + "2019-02-19 06:34:03,018 MARCO_AVG: acc 0.8847 - f1-score 0.8862\n", + "2019-02-19 06:34:03,019 0 tp: 894 - fp: 89 
- fn: 152 - tn: 894 - precision: 0.9095 - recall: 0.8547 - accuracy: 0.8812 - f1-score: 0.8812\n", + "2019-02-19 06:34:03,020 1 tp: 957 - fp: 152 - fn: 89 - tn: 957 - precision: 0.8629 - recall: 0.9149 - accuracy: 0.8882 - f1-score: 0.8881\n", + "2019-02-19 06:34:03,020 ----------------------------------------------------------------------------------------------------\n" + ] + }, + { + "data": { + "text/plain": [ + "{'test_score': 0.8848,\n", + " 'dev_score_history': [0.7349,\n", + " 0.7599,\n", + " 0.7714,\n", + " 0.7859,\n", + " 0.7994,\n", + " 0.8054,\n", + " 0.7654,\n", + " 0.7994,\n", + " 0.8069,\n", + " 0.8179,\n", + " 0.8169,\n", + " 0.8114,\n", + " 0.8329,\n", + " 0.8289,\n", + " 0.8579,\n", + " 0.8744,\n", + " 0.8754,\n", + " 0.8739,\n", + " 0.8789,\n", + " 0.9025,\n", + " 0.8769,\n", + " 0.8749,\n", + " 0.8944,\n", + " 0.907,\n", + " 0.904,\n", + " 0.9185,\n", + " 0.9055,\n", + " 0.92,\n", + " 0.914,\n", + " 0.9065,\n", + " 0.925,\n", + " 0.9165,\n", + " 0.917,\n", + " 0.9215,\n", + " 0.9055,\n", + " 0.908,\n", + " 0.926,\n", + " 0.927,\n", + " 0.93,\n", + " 0.925,\n", + " 0.9235,\n", + " 0.921,\n", + " 0.9235,\n", + " 0.9295,\n", + " 0.9185,\n", + " 0.926,\n", + " 0.9245,\n", + " 0.9185,\n", + " 0.9195,\n", + " 0.917,\n", + " 0.9055,\n", + " 0.918,\n", + " 0.914,\n", + " 0.926,\n", + " 0.924,\n", + " 0.923,\n", + " 0.9205,\n", + " 0.9205,\n", + " 0.924,\n", + " 0.9245,\n", + " 0.9195,\n", + " 0.922,\n", + " 0.921,\n", + " 0.923,\n", + " 0.92,\n", + " 0.9135,\n", + " 0.9195,\n", + " 0.9145,\n", + " 0.922,\n", + " 0.923,\n", + " 0.9205,\n", + " 0.9195,\n", + " 0.921,\n", + " 0.927,\n", + " 0.922,\n", + " 0.9205,\n", + " 0.914,\n", + " 0.92,\n", + " 0.9245,\n", + " 0.925,\n", + " 0.903,\n", + " 0.9185,\n", + " 0.918,\n", + " 0.921,\n", + " 0.9245,\n", + " 0.9095,\n", + " 0.91,\n", + " 0.918,\n", + " 0.9235,\n", + " 0.915,\n", + " 0.924,\n", + " 0.918,\n", + " 0.922,\n", + " 0.9155,\n", + " 0.914,\n", + " 0.9145,\n", + " 0.918,\n", + " 0.9215,\n", + " 
0.92,\n", + " 0.9285,\n", + " 0.9205,\n", + " 0.925,\n", + " 0.924,\n", + " 0.91,\n", + " 0.919,\n", + " 0.918,\n", + " 0.9195],\n", + " 'train_loss_history': [0.016708851694586187,\n", + " 0.015160481161020435,\n", + " 0.014552138807315904,\n", + " 0.013930917686584849,\n", + " 0.013529171745206688,\n", + " 0.013466031610253915,\n", + " 0.013145331682230189,\n", + " 0.012817235365284224,\n", + " 0.012712909168018802,\n", + " 0.012545509526708477,\n", + " 0.01243734514941351,\n", + " 0.012369954493422467,\n", + " 0.011985785183043314,\n", + " 0.011734974272046722,\n", + " 0.011265585188927707,\n", + " 0.009753199330176427,\n", + " 0.008712939202022329,\n", + " 0.008085133701183956,\n", + " 0.007628458493796058,\n", + " 0.007359891166205245,\n", + " 0.007021535409405393,\n", + " 0.0068794458783159465,\n", + " 0.006523635948451897,\n", + " 0.006310657831531399,\n", + " 0.006219421519852671,\n", + " 0.006067579466608089,\n", + " 0.006013898238806183,\n", + " 0.005733796698424447,\n", + " 0.0057139206003931345,\n", + " 0.005473889973129466,\n", + " 0.005376285016842155,\n", + " 0.00523868023881753,\n", + " 0.005051989691873922,\n", + " 0.005016283240534711,\n", + " 0.004839610288709917,\n", + " 0.004950970484230559,\n", + " 0.004769527550500547,\n", + " 0.0046601146442979335,\n", + " 0.004447404004039806,\n", + " 0.004532231647313424,\n", + " 0.00438205041639818,\n", + " 0.004246738519083316,\n", + " 0.004066525674837579,\n", + " 0.003926651166311192,\n", + " 0.004010900164831025,\n", + " 0.003835272856796392,\n", + " 0.0038848838711739663,\n", + " 0.003801890622175255,\n", + " 0.0035123873102948966,\n", + " 0.003456471815344966,\n", + " 0.0035348378520145304,\n", + " 0.0034528942777046537,\n", + " 0.003348463570674638,\n", + " 0.003193427973256063,\n", + " 0.003242392421183077,\n", + " 0.0030558225421823608,\n", + " 0.0030510075235736364,\n", + " 0.0029469775199211967,\n", + " 0.0028531293365197997,\n", + " 0.002834125804684923,\n", + " 0.0027787558807236194,\n", + " 
0.0027531463259204804,\n", + " 0.0025840972514633727,\n", + " 0.0026839049507555997,\n", + " 0.002527960452501411,\n", + " 0.002543972393569869,\n", + " 0.002498156162445083,\n", + " 0.002457980479604402,\n", + " 0.0024528499806334,\n", + " 0.0023583637921873435,\n", + " 0.002392645299735235,\n", + " 0.002279001029983971,\n", + " 0.002196007255093171,\n", + " 0.002195928766141565,\n", + " 0.001935656289787772,\n", + " 0.0019363653748697648,\n", + " 0.0018713638718433575,\n", + " 0.0019595822783970668,\n", + " 0.0019903742065232113,\n", + " 0.001939045057511014,\n", + " 0.0019225626514375645,\n", + " 0.001705819316066487,\n", + " 0.0017266585037307453,\n", + " 0.0016854887821701474,\n", + " 0.0015841096522989605,\n", + " 0.001820786543977104,\n", + " 0.0016709693140520654,\n", + " 0.0016224729744373856,\n", + " 0.001661624518069777,\n", + " 0.0017472637632891504,\n", + " 0.0014731667006905014,\n", + " 0.0014054862485825485,\n", + " 0.0015519472988850594,\n", + " 0.001334842675344536,\n", + " 0.0013547355089343052,\n", + " 0.0013040071516550909,\n", + " 0.0013844019493054816,\n", + " 0.0011575900212547356,\n", + " 0.0013619943227098574,\n", + " 0.0011829861343373084,\n", + " 0.001247771065135475,\n", + " 0.0012492339696869494,\n", + " 0.0012906563962573965,\n", + " 0.0012776504237974814,\n", + " 0.000895365420656988,\n", + " 0.0008274823035215936,\n", + " 0.0006204608782981346],\n", + " 'dev_loss_history': [0.015533569268882275,\n", + " 0.014857761561870575,\n", + " 0.014346286654472351,\n", + " 0.013920259661972523,\n", + " 0.013386452570557594,\n", + " 0.012671118602156639,\n", + " 0.014364621601998806,\n", + " 0.012792730703949928,\n", + " 0.01260459516197443,\n", + " 0.012190107256174088,\n", + " 0.012093155644834042,\n", + " 0.012637223117053509,\n", + " 0.011709899641573429,\n", + " 0.01152237132191658,\n", + " 0.010071340948343277,\n", + " 0.008730717934668064,\n", + " 0.009065507911145687,\n", + " 0.008951223455369473,\n", + " 0.008494862355291843,\n", + " 
0.007422446273267269,\n", + " 0.009027659893035889,\n", + " 0.010181138291954994,\n", + " 0.00811642687767744,\n", + " 0.007011303212493658,\n", + " 0.007075179368257523,\n", + " 0.006715509574860334,\n", + " 0.007419547066092491,\n", + " 0.006599108688533306,\n", + " 0.0067612831480801105,\n", + " 0.007427784148603678,\n", + " 0.006313795689493418,\n", + " 0.006555614527314901,\n", + " 0.006710393819957972,\n", + " 0.006489144638180733,\n", + " 0.007628345862030983,\n", + " 0.007547229994088411,\n", + " 0.0067196800373494625,\n", + " 0.006582622416317463,\n", + " 0.006891313940286636,\n", + " 0.006393517833203077,\n", + " 0.006469651125371456,\n", + " 0.00665303785353899,\n", + " 0.006635638885200024,\n", + " 0.006639295723289251,\n", + " 0.0068130530416965485,\n", + " 0.006843602284789085,\n", + " 0.006837761960923672,\n", + " 0.007117715664207935,\n", + " 0.007072587497532368,\n", + " 0.007978592999279499,\n", + " 0.009340363554656506,\n", + " 0.007133088540285826,\n", + " 0.007803276181221008,\n", + " 0.0067718359641730785,\n", + " 0.00798116996884346,\n", + " 0.007982995361089706,\n", + " 0.00787285715341568,\n", + " 0.008055082522332668,\n", + " 0.00815735012292862,\n", + " 0.007912601344287395,\n", + " 0.008659182116389275,\n", + " 0.007356438785791397,\n", + " 0.00804904755204916,\n", + " 0.008919219486415386,\n", + " 0.007776861544698477,\n", + " 0.01033700816333294,\n", + " 0.009298614226281643,\n", + " 0.00871719978749752,\n", + " 0.00926122721284628,\n", + " 0.009263498708605766,\n", + " 0.009112130850553513,\n", + " 0.00948996003717184,\n", + " 0.008984975516796112,\n", + " 0.009276941418647766,\n", + " 0.009573808871209621,\n", + " 0.009178363718092442,\n", + " 0.010200003162026405,\n", + " 0.008755668997764587,\n", + " 0.00981319509446621,\n", + " 0.00911485031247139,\n", + " 0.010518982075154781,\n", + " 0.009392832405865192,\n", + " 0.010198121890425682,\n", + " 0.010506096296012402,\n", + " 0.011796471662819386,\n", + " 0.012919222936034203,\n", + 
" 0.011561417952179909,\n", + " 0.009509583935141563,\n", + " 0.009394108317792416,\n", + " 0.010476901195943356,\n", + " 0.011427275836467743,\n", + " 0.011473114602267742,\n", + " 0.011757048778235912,\n", + " 0.012347670271992683,\n", + " 0.010681777261197567,\n", + " 0.012262973934412003,\n", + " 0.011161251924932003,\n", + " 0.01133703999221325,\n", + " 0.01141116302460432,\n", + " 0.012089996598660946,\n", + " 0.011495801620185375,\n", + " 0.012117942795157433,\n", + " 0.011746374890208244,\n", + " 0.012131287716329098,\n", + " 0.012441350147128105,\n", + " 0.013480187393724918,\n", + " 0.01386656891554594]}" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# 7. start the training\n", + "trainer.train('/local/burghbvander/flair_experiments/',\n", + " learning_rate=0.1,\n", + " mini_batch_size=32,\n", + " anneal_factor=0.5,\n", + " patience=5,\n", + " max_epochs=150)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "# 8. 
plot training curves (optional)\n", + "from flair.visual.training_curves import Plotter\n", + "plotter = Plotter()\n", + "plotter.plot_training_curves('/local/burghbvander/flair_experiments/loss.tsv')\n", + "plotter.plot_weights('/local/burghbvander/flair_experiments/weights.txt')" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.1" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/experiments/dutch/flair/requirements.txt b/experiments/dutch/flair/requirements.txt new file mode 100644 index 0000000..276ef1b --- /dev/null +++ b/experiments/dutch/flair/requirements.txt @@ -0,0 +1 @@ +flair==0.4.0 \ No newline at end of file diff --git a/experiments/dutch/svm/README.md b/experiments/dutch/svm/README.md new file mode 100644 index 0000000..37feef0 --- /dev/null +++ b/experiments/dutch/svm/README.md @@ -0,0 +1,7 @@ +# SVM classifier baseline + +## Description + +[LinearSVC](https://scikit-learn.org/stable/modules/generated/sklearn.svm.LinearSVC.html) from [scikit-learn](https://scikit-learn.org) was used to obtain a baseline for the sentiment polarity classification task. 
+ +The folder simply includes the Jupyter Notebook (`svm_experiment.ipynb`) that was used to run the experiment and a `requirements.txt` listing its dependency. \ No newline at end of file diff --git a/experiments/dutch/svm/requirements.txt b/experiments/dutch/svm/requirements.txt new file mode 100644 index 0000000..1afcc19 --- /dev/null +++ b/experiments/dutch/svm/requirements.txt @@ -0,0 +1 @@ +scikit-learn==0.20.1 \ No newline at end of file diff --git a/experiments/dutch/svm/svm_experiment.ipynb b/experiments/dutch/svm/svm_experiment.ipynb new file mode 100644 index 0000000..13d656d --- /dev/null +++ b/experiments/dutch/svm/svm_experiment.ipynb @@ -0,0 +1,163 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "from sklearn.datasets import load_files\n", + "from sklearn.feature_extraction.text import TfidfVectorizer\n", + "from sklearn.svm import LinearSVC\n", + "from sklearn.metrics import accuracy_score" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "basedir = '/local/burghbvander/110kDBRDv2/'" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "train = load_files(basedir + 'train', encoding='utf-8')\n", + "test = load_files(basedir + 'test', encoding='utf-8')" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "x_orig_train, y_train = train.data, train.target\n", + "x_orig_test, y_test = test.data, test.target" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "TfidfVectorizer(analyzer='word', binary=False, decode_error='strict',\n", + " dtype=, encoding='utf-8', input='content',\n", + " lowercase=True, max_df=1.0, max_features=None, min_df=1,\n", + " ngram_range=(1, 4), norm='l2', preprocessor=None, smooth_idf=True,\n", + " stop_words=None, strip_accents=None, sublinear_tf=False,\n", + " token_pattern='(?u)\\\\b\\\\w\\\\w+\\\\b', tokenizer=None, 
use_idf=True,\n", + " vocabulary=None)" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ngram_range = (1,4)\n", + "analyzer = 'word'\n", + "\n", + "vectorizer = TfidfVectorizer(\n", + " ngram_range=ngram_range,\n", + " analyzer=analyzer\n", + ")\n", + "\n", + "vectorizer.fit(x_orig_train + x_orig_test)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "x_train = vectorizer.transform(x_orig_train)\n", + "x_test = vectorizer.transform(x_orig_test)" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "LinearSVC(C=1.0, class_weight=None, dual=True, fit_intercept=True,\n", + " intercept_scaling=1, loss='squared_hinge', max_iter=1000,\n", + " multi_class='ovr', penalty='l2', random_state=None, tol=0.0001,\n", + " verbose=0)" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "svc = LinearSVC()\n", + "svc.fit(x_train, y_train)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "y_pred = svc.predict(x_test)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.8915950334288443" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "accuracy_score(y_test, y_pred)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.1" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git 
a/experiments/dutch/ulmfit_no_pretrain/README.md b/experiments/dutch/ulmfit_no_pretrain/README.md new file mode 100644 index 0000000..a4d9e72 --- /dev/null +++ b/experiments/dutch/ulmfit_no_pretrain/README.md @@ -0,0 +1,9 @@ +# ULMFiT experiment without a pre-trained LM + +## Description + +This folder contains a Jupyter Notebook with experiments and results on the 110kDBRD dataset for sentiment polarity classification. It uses no pre-trained LM and the LM is therefore trained on all available data in 110kDBRD. + +## Run + +Change the `path` variable in the notebook so that it points to your local copy of the 110kDBRD dataset; the Jupyter Notebook should then run as-is. \ No newline at end of file diff --git a/experiments/dutch/ulmfit_no_pretrain/requirements.txt b/experiments/dutch/ulmfit_no_pretrain/requirements.txt new file mode 100644 index 0000000..5abc0a5 --- /dev/null +++ b/experiments/dutch/ulmfit_no_pretrain/requirements.txt @@ -0,0 +1 @@ +fastai==1.0.45 \ No newline at end of file diff --git a/experiments/dutch/ulmfit_no_pretrain/ulmfit_no_pretrain.ipynb b/experiments/dutch/ulmfit_no_pretrain/ulmfit_no_pretrain.ipynb new file mode 100644 index 0000000..571f075 --- /dev/null +++ b/experiments/dutch/ulmfit_no_pretrain/ulmfit_no_pretrain.ipynb @@ -0,0 +1,1062 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# 110kDBRD" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "%reload_ext autoreload\n", + "%autoreload 2\n", + "%matplotlib inline" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.text import *" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Preparing the data" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/tmp_lm'),\n", + " 
PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/test'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/unsup'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/urls.txt'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/tmp_clas'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/train'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2_no_pretrain/models')]" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "path = Path('/local/burghbvander/110kDBRDv2_no_pretrain/')\n", + "path.ls()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "bs=118" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "data_lm = (TextList.from_folder(path)\n", + " #Inputs: all the text files in path\n", + " .filter_by_folder(include=['train', 'test', 'unsup']) \n", + " #We may have other temp folders that contain text files so we only keep what's in train and test\n", + " .random_split_by_pct(0.1)\n", + " #We randomly split and keep 10% (10,000 reviews) for validation\n", + " .label_for_lm() \n", + " #We want to do a language model so we label accordingly\n", + " .databunch(bs=bs))\n", + "data_lm.save('tmp_lm')" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "data_lm = load_data(path, 'tmp_lm', bs=bs)" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
idxtext
0ik uiteindelijk wel zeker , xxmaj matthias was dood . \\n xxmaj uit de verschillende verhaallijnen heb ik echter nooit kunnen distilleren wie xxmaj matthias nu wel was . xxmaj wel was het duidelijk dat hij op zijn weg heel wat tegenslagen te verwerken kreeg en niet altijd begrepen werd . \\n xxmaj ik kreeg wel een beter beeld van de naasten van xxmaj matthias . \\n
1de schrijver . \\n ' xxmaj het is autobiografisch , helemaal waargebeurd maar toch zie je elementen van fictie in de stijl en vooral de opbouw , dat maakt het des te sterker . ' - xxmaj win boeken voor je hele leesclub ! \\n ' xxmaj wat beweegt de jonge zwarte deelpachter xxmaj tucker xxmaj caliban om huis , vee en akkers te vernietigen en met vrouw
2xxmaj win boeken voor je hele leesclub ! \\n ' xxmaj wat beweegt de jonge zwarte deelpachter xxmaj tucker xxmaj caliban om huis , vee en akkers te vernietigen en met vrouw en kind naar het xxmaj noorden te vertrekken?'- xxmaj win xxmaj uit de maat voor je hele leesgroep ! \\n xxmaj we gaan xxmaj wil van xxmaj jeroen xxmaj olyslaegers luisteren via de gratis xxmaj hebban
3xxmaj je leert veel over het katholieke geloof , de verschillende stromingen , geschiedenis en gebruiken . xxmaj al vanaf de eerste bladzijden toont xxmaj caldwell zich een goed onderwijzer , de inleiding is een historische kanttekening over de verschillende stromingen binnen deze religie . xxmaj in het verhaal wordt uitvoerig ingegaan op het verloop van het xxunk onderzoek binnen het xxmaj vaticaan . xxmaj de zorgvuldig uitgewerkte details hebben
4mag xxmaj ambrose van zijn moeder niet met hem omgaan . xxmaj totdat hij erachter komt dat ze allebei gek zijn op xxunk ... \\n \\n xxmaj het eerste wat mij opviel was dat xxunk een grote rol speelt in het boek . xxmaj ambrose is natuurlijk gek op xxunk , dus komt dat ook veel voor in het boek . xxmaj zo is de de titel van het
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "data_lm.show_batch()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Language model" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.text.models import AWD_LSTM" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "learn = language_model_learner(data_lm, AWD_LSTM, drop_mult=0.3)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Min numerical gradient: 1.58E-02\n" + ] + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot(skip_end=15)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 44:32

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
13.8611423.6811370.362308
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "learn.fit_one_cycle(1, 1e-2, moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fit_head')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('fit_head');" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To complete the fine-tuning, we can then unfreeze the model and launch a new training run." + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "learn.unfreeze()" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "

" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot(skip_end=15)" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.callbacks import SaveModelCallback\n", + "cb = SaveModelCallback(learn, every='epoch')" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "
\n", + " \n", + " \n", + " 65.00% [13/20 10:52:59<5:51:36]\n", + "
\n", + " \n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
13.6710353.6039900.369439
23.6000483.5262030.377952
33.5221763.4461750.386902
43.4075563.3740150.395235
53.3594153.3147430.402030
63.3354503.2665840.407596
73.2747443.2299750.411999
83.2435053.2005300.415410
93.2091893.1776830.418160
103.2099213.1583600.420391
113.1370683.1434750.422215
123.1702853.1313290.423638
133.1180373.1218550.424704
\n", + "\n", + "\n", + "
\n", + " \n", + " \n", + " Interrupted\n", + "
\n", + " " + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "ename": "KeyboardInterrupt", + "evalue": "", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mlearn\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfit_one_cycle\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m20\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1e-4\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmoms\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0.8\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;36m0.7\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcallbacks\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mcb\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/train.py\u001b[0m in \u001b[0;36mfit_one_cycle\u001b[0;34m(learn, cyc_len, max_lr, moms, div_factor, pct_start, wd, callbacks, tot_epochs, start_epoch)\u001b[0m\n\u001b[1;32m 20\u001b[0m callbacks.append(OneCycleScheduler(learn, max_lr, moms=moms, div_factor=div_factor, pct_start=pct_start, tot_epochs=tot_epochs, \n\u001b[1;32m 21\u001b[0m start_epoch=start_epoch))\n\u001b[0;32m---> 22\u001b[0;31m \u001b[0mlearn\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcyc_len\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_lr\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mwd\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mwd\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcallbacks\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcallbacks\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 23\u001b[0m 
\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 24\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mlr_find\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlearn\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mLearner\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstart_lr\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mFloats\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m1e-7\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mend_lr\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mFloats\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m10\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_it\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m100\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstop_div\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mbool\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mwd\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/basic_train.py\u001b[0m in \u001b[0;36mfit\u001b[0;34m(self, epochs, lr, wd, callbacks)\u001b[0m\n\u001b[1;32m 176\u001b[0m \u001b[0mcallbacks\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mcb\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mcb\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcallback_fns\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0mlistify\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcallbacks\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 177\u001b[0m fit(epochs, self.model, self.loss_func, opt=self.opt, data=self.data, metrics=self.metrics,\n\u001b[0;32m--> 178\u001b[0;31m callbacks=self.callbacks+callbacks)\n\u001b[0m\u001b[1;32m 179\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 180\u001b[0m \u001b[0;32mdef\u001b[0m 
\u001b[0mcreate_opt\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mlr\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mFloats\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mwd\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mFloats\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0.\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m->\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/utils/mem.py\u001b[0m in \u001b[0;36mwrapper\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 78\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 79\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 80\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 81\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 82\u001b[0m if (\"CUDA out of memory\" in str(e) or\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/basic_train.py\u001b[0m in \u001b[0;36mfit\u001b[0;34m(epochs, model, loss_func, opt, data, callbacks, metrics)\u001b[0m\n\u001b[1;32m 88\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mxb\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0myb\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mprogress_bar\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtrain_dl\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mparent\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mpbar\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 89\u001b[0m \u001b[0mxb\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0myb\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcb_handler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_batch_begin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mxb\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0myb\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 90\u001b[0;31m \u001b[0mloss\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mloss_batch\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mxb\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0myb\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mloss_func\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mopt\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcb_handler\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 91\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mcb_handler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_batch_end\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mloss\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;32mbreak\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 92\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/basic_train.py\u001b[0m in \u001b[0;36mloss_batch\u001b[0;34m(model, xb, yb, loss_func, opt, cb_handler)\u001b[0m\n\u001b[1;32m 25\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 26\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mopt\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 27\u001b[0;31m \u001b[0mloss\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0mcb_handler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_backward_begin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mloss\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 28\u001b[0m \u001b[0mloss\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbackward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 29\u001b[0m \u001b[0mcb_handler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_backward_end\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/callback.py\u001b[0m in \u001b[0;36mon_backward_begin\u001b[0;34m(self, loss)\u001b[0m\n\u001b[1;32m 240\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mon_backward_begin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mloss\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mTensor\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m->\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 241\u001b[0m \u001b[0;34m\"Handle gradient calculation on `loss`.\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 242\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msmoothener\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0madd_value\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mloss\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdetach\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcpu\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 243\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstate_dict\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'last_loss'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstate_dict\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'smooth_loss'\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mloss\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msmoothener\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msmooth\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 244\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mcb\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcallbacks\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mKeyboardInterrupt\u001b[0m: " + ] + } + ], + "source": [ + "learn.fit_one_cycle(20, 1e-4, moms=(0.8,0.7), callbacks=[cb])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fine_tuned')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "How good is our model? Well let's try to see what it predicts after a few given words." + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('bestmodel_13');" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "TEXT = \"Wat een fantastisch boek\"\n", + "N_WORDS = 40\n", + "N_SENTENCES = 2" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "print(\"\\n\".join(learn.predict(TEXT, N_WORDS, temperature=0.75) for _ in range(N_SENTENCES)))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We have to save the model but also it's encoder, the part that's responsible for creating and updating the hidden state. For the next part, we don't care about the part that tries to guess the next word." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save_encoder('fine_tuned_enc')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Classifier" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now, we'll create a new data object that only grabs the labelled data and keeps those labels. Again, this line takes a bit of time." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "bs = 32" + ] + }, + { + "cell_type": "code", + "execution_count": 42, + "metadata": {}, + "outputs": [], + "source": [ + "data_clas = (TextList.from_folder(path, vocab=data_lm.vocab)\n", + " #grab all the text files in path\n", + " .split_by_folder(valid='test')\n", + " #split by train and valid folder (that only keeps 'train' and 'test' so no need to filter)\n", + " .label_from_folder(classes=['neg', 'pos'])\n", + " #label them all with their folders\n", + " .databunch(bs=bs))\n", + "\n", + "data_clas.save('tmp_clas')" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "scrolled": false + }, + "outputs": [], + "source": [ + "data_clas = load_data(path, 'tmp_clas', bs=bs)" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
texttarget
xxbos “ xxmaj het huwelijk is het graf van de liefde . ” \\n \\n xxmaj woorden , woorden , woorden . xxmaj in de juiste volgorde vormen ze een universum waarin je helemaal wil verdwijnen . xxmaj alleen al bij het horen van de naam xxmaj proust word ik – heel toepasselijk - teruggeworpen naar die heerlijke weken waarin ik mocht verdwalen in de omgeving van xxmaj xxunkneg
xxbos xxup de xxup cover \\n \\n xxmaj de cover toont een xxunk zoals xxmaj homeros dat waarschijnlijk in zijn gedachten had toen hij de ' xxmaj odysseus ' geschreven heeft . \\n \\n xxmaj op de achtergrond zie je felle xxunk die van een onweer kunnen zijn , maar evengoed kan het de verschijning van één of andere god zijn . xxmaj het gaat nu éénmaal overpos
xxbos xxmaj het is zo treurig dat in het tijdperk waarin iedereen ( in de vrije wereld althans ) uitstekend xxunk is om de juistheid of xxunk van elke stelling , elke bewering zelf na te gaan , vrijwel niemand de moeite neemt om het te doen . xxmaj het kritisch vermogen ontbreekt kennelijk volkomen . xxmaj een paar xxunk en je duikt in gedigitaliseerde archieven , bekijkt ebook versiesneg
xxbos xxmaj david xxmaj garnett ( 1892 - 1981 ) schreef dit debuut al in 1922 en de novelle werd meteen als meesterwerk bestempeld . xxmaj hij maakte destijds deel uit van de xxmaj xxunk - die bestond uit schrijvers , kunstenaars en intellectuelen - waar onder andere ook xxmaj virginia xxmaj woolf , haar echtgenoot xxmaj leonard xxmaj woolf , xxmaj vanessa en xxmaj clive xxmaj bell , xxmajpos
xxbos xxmaj hij is wonderbaarlijk lichtvoetig , die xxmaj daniel xxmaj kehlmann , en gezegend met een onbegrijpelijk soepele pen . xxmaj ogenschijnlijk achteloos schudt hij de ene originele en vederlichte zin na de andere uit de mouw , en hij presenteert allerlei filosofische thema 's of tragische scenes met zo'n virtuositeit en souplesse dat je de zwaarte en complexiteit van hun inhoud bijna vergeet . xxmaj sommige recensenten vindenpos
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "data_clas.show_batch()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can then create a model to classify those reviews and load the encoder we saved before." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "learn = text_classifier_learner(data_clas, AWD_LSTM, drop_mult=0.5)\n", + "learn.load_encoder('fine_tuned_enc')" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Min numerical gradient: 1.74E-01\n" + ] + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot()" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 02:47

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.5240420.4085990.811843
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "learn.fit_one_cycle(1, 1e-3, moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('first')" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('first');" + ] + }, + { + "cell_type": "code", + "execution_count": 38, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 16:41

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.4142960.2675850.892073
20.3241290.2292280.914040
30.2995210.2259340.914518
40.2756850.2081430.927412
50.2521720.2164820.923114
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "learn.freeze_to(-2)\n", + "learn.fit_one_cycle(5, slice(1e-2/(2.6**4),1e-2), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('second')" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('second');" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.callbacks import SaveModelCallback\n", + "cb = SaveModelCallback(learn)" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 04:43

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.3260480.2361890.903534
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "learn.freeze_to(-3)\n", + "learn.fit_one_cycle(1, slice(5e-6/(2.6**4),5e-5), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "

\n", + " \n", + " \n", + " 50.00% [1/2 08:20<08:20]\n", + "
\n", + " \n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.2429300.2177290.923114
\n", + "\n", + "\n", + "
\n", + " \n", + " \n", + " 93.89% [553/589 08:23<00:32 0.2488]\n", + "
\n", + " " + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "learn.unfreeze()\n", + "learn.fit_one_cycle(2, slice(1e-3/(2.6**4),1e-3), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fitted') # better train loss, same accuracy" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.show_results(rows=10)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "interp = learn.interpret()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "interp.plot_confusion_matrix()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.1" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/experiments/dutch/ulmfit_pretrained_wiki/README.md b/experiments/dutch/ulmfit_pretrained_wiki/README.md new file mode 100644 index 0000000..e26c313 --- /dev/null +++ b/experiments/dutch/ulmfit_pretrained_wiki/README.md @@ -0,0 +1,13 @@ +# ULMFiT pre-trained LM experiment + +## Description + +This folder contains a Jupyter Notebook with experiments and results on the 110kDBRD dataset for sentiment polarity classification. We first pre-trained a model on Dutch Wikipedia. + +## Pre-trained Dutch LM + +An LM pre-trained on the Dutch Wikipedia can be downloaded from here: http://bit.ly/2trOhzq + +## Run + +The `path` variable to the 110kDBRD dataset should be changed and the Jupyter Notebook should run fine. 
\ No newline at end of file diff --git a/experiments/dutch/ulmfit_pretrained_wiki/requirements.txt b/experiments/dutch/ulmfit_pretrained_wiki/requirements.txt new file mode 100644 index 0000000..5abc0a5 --- /dev/null +++ b/experiments/dutch/ulmfit_pretrained_wiki/requirements.txt @@ -0,0 +1 @@ +fastai==1.0.45 \ No newline at end of file diff --git a/experiments/dutch/ulmfit_pretrained_wiki/ulmfit_pretrain_exeperiment.ipynb b/experiments/dutch/ulmfit_pretrained_wiki/ulmfit_pretrain_exeperiment.ipynb new file mode 100644 index 0000000..ce4b01b --- /dev/null +++ b/experiments/dutch/ulmfit_pretrained_wiki/ulmfit_pretrain_exeperiment.ipynb @@ -0,0 +1,1404 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# IMDB" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "%reload_ext autoreload\n", + "%autoreload 2\n", + "%matplotlib inline" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.text import *" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Preparing the data" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[PosixPath('/local/burghbvander/110kDBRDv2/tmp_lm'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/test'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/unsup'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/tmp_clas_bs96'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/urls.txt'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/tmp_clas'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/train'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/tmp_clas_bs64'),\n", + " PosixPath('/local/burghbvander/110kDBRDv2/models')]" + ] + }, + 
"execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "path = Path('/local/burghbvander/110kDBRDv2/')\n", + "path.ls()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "bs=118" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "ename": "KeyboardInterrupt", + "evalue": "", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[1;32m 1\u001b[0m data_lm = (TextList.from_folder(path)\n\u001b[1;32m 2\u001b[0m \u001b[0;31m#Inputs: all the text files in path\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 3\u001b[0;31m \u001b[0;34m.\u001b[0m\u001b[0mfilter_by_folder\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0minclude\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'train'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'test'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'unsup'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 4\u001b[0m \u001b[0;31m#We may have other temp folders that contain text files so we only keep what's in train and test\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5\u001b[0m \u001b[0;34m.\u001b[0m\u001b[0mrandom_split_by_pct\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0.1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/data_block.py\u001b[0m in \u001b[0;36mfilter_by_folder\u001b[0;34m(self, include, exclude)\u001b[0m\n\u001b[1;32m 155\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mexclude\u001b[0m 
\u001b[0;32mand\u001b[0m \u001b[0mn\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mexclude\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;32mFalse\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 156\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;32mTrue\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 157\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfilter_by_func\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0m_inner\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 158\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 159\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mfilter_by_rand\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mp\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mfloat\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mseed\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/data_block.py\u001b[0m in \u001b[0;36mfilter_by_func\u001b[0;34m(self, func)\u001b[0m\n\u001b[1;32m 144\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mfilter_by_func\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0mCallable\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m->\u001b[0m\u001b[0;34m'ItemList'\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 145\u001b[0m \u001b[0;34m\"Only keep elements for which `func` returns `True`.\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 146\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mo\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mo\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mo\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 147\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 148\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m/local/burghbvander/anaconda3/lib/python3.7/site-packages/fastai/core.py\u001b[0m in \u001b[0;36marray\u001b[0;34m(a, dtype, **kwargs)\u001b[0m\n\u001b[1;32m 261\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mint_\u001b[0m\u001b[0;34m==\u001b[0m\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mint32\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mdtype\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mis_listy\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mint\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 262\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mint64\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 263\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdtype\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 264\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 265\u001b[0m \u001b[0;32mclass\u001b[0m \u001b[0mEmptyLabel\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mItemBase\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mKeyboardInterrupt\u001b[0m: " + ], + "output_type": "error" + } + ], + "source": [ + "data_lm = (TextList.from_folder(path)\n", + " #Inputs: all the text files in path\n", + " .filter_by_folder(include=['train', 'test', 'unsup']) \n", + " #We may have other temp folders that contain text files so we only keep what's in train and test\n", + " .random_split_by_pct(0.1)\n", + " #We randomly split and keep 10% (10,000 reviews) for validation\n", + " .label_for_lm() \n", + " #We want to do a language model so we label accordingly\n", + " .databunch(bs=bs))\n", + "data_lm.save('tmp_lm')" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "data_lm = load_data(path, 'tmp_lm', bs=bs)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
idxtext
0ik uiteindelijk wel zeker , xxmaj matthias was dood . \\n xxmaj uit de verschillende verhaallijnen heb ik echter nooit kunnen distilleren wie xxmaj matthias nu wel was . xxmaj wel was het duidelijk dat hij op zijn weg heel wat tegenslagen te verwerken kreeg en niet altijd begrepen werd . \\n xxmaj ik kreeg wel een beter beeld van de naasten van xxmaj matthias . \\n
1/ / xxunk / boeken / girl - online - on - tour / xxbos xxmaj tjonge wat een debuut . xxmaj ik heb van het begin tot het eind genoten . xxmaj schrijf maar lekker door xxmaj elizabeth . u heeft er een fan bij ! \\n xxmaj voor mij is dit boek 5 duimpjes waard ! xxbos xxmaj wanneer je ontwikkeling zoekt in een serie dan ben
2laten invoelen in de personages zodat je je echt één voelt met ze . xxmaj wat een verschrikkelijke mensen het soms ook zijn . \\n xxmaj dit is geen gewone thriller zoals je gewend bent , de spanning en de snelheid zitten er wel degelijk in maar op een totaal andere manier . xxmaj er worden geen mensen vermoord en achtervolgingen gedaan maar er wordt op een rustige intrigerende
3xxmaj angstaanjagend , dat wel . \\n \\n xxmaj de schrijfstijl van xxmaj lauerhohn is direct , ongenuanceerd en hier en daar zelfs hard , maar dat sluit naadloos aan bij het verhaal . xxmaj de sfeer is benauwend werkelijk , filmisch haast . \\n \\n “ xxmaj ze stond in een portiek tegenover hun bouwval en xxunk hem . xxmaj het meisje wees met een bevende vinger
4raadselachtige wijze overlijd is het voor de jonge xxmaj michele duidelijk , hij en zijn vader staan lijnrecht tegenover elkaar . \\n xxmaj dit deel van het boek vind ik ontzettend spannend en soms ook luguber , maar tegelijkertijd ook moeilijk omdat er veel politiek naar boven komt , en je goed moet opletten hoe de verschillende idealen zich ontwikkelen , en op welke manier deze tegenover elkaar komen
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_lm.show_batch()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Language model" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.text.models import AWD_LSTM" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "learn = language_model_learner(data_lm, AWD_LSTM, pretrained_fnames=['lm_best', 'itos'], drop_mult=0.3)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Min numerical gradient: 2.75E-02\n" + ] + }, + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAZgAAAEKCAYAAAAvlUMdAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4wLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvqOYd8AAAIABJREFUeJzt3Xd8leX9//HX52RBBhAgASRhha0MISCKMlx1r6pF67al1tVqbX9t7bBaO77V1tr224pUrVq3XyuOilREUFlBhoJswggjCWEkBLLO9fvj3JSICQnh3OckJ+/n43E/OOeen4uT5H3udd3mnENERCTcAtEuQEREYpMCRkREfKGAERERXyhgRETEFwoYERHxhQJGRER8oYARERFfKGBERMQXChgREfFFfLQLCKfOnTu7Xr16RbsMEZEWY9GiRcXOuQw/1h1TAdOrVy/y8vKiXYaISIthZhv9WrcOkYmIiC8UMCIi4gsFjIiI+EIBIyIivlDAiIiIL3wNGDPLN7NPzWyJmX3p8i4zG2hmc82swszuOZplRUSkeYvEZcoTnXPF9UwrAe4ELmnCsiIi0oxF9RCZc67QObcQqIpmHY++t4bXlxRQWHogmmWIiMQUv/dgHPCumTngMefclHAva2aTgckAPXr0OOoCD1TV8NTH+ZTsqwSgf5dUTsnpzIie6fTNSKVPRgptEuKOer0iIq2dOef8W7lZd+dcgZllAjOAO5xzs+uY7z6gzDn30NEuW1tubq5ryp38NUHH8q17+GjtTj5eV8yCDSVUVAcBCBj06JjMFbnZ3Daxb6PWV1UTZPnWvQzLao+ZHXU9IiKRYmaLnHO5fqzb1z0Y51yB92+hmb0GjAaOGBLhWPZoxQWMoVkdGJrVgW9PyKGiuoYNxftYs6OMNYVlzF+/k99NX0X/LmmcNbhLg+t7+N3V/O2DdVx/ck9+duHxxAUUMtFSXlnNjr0VdGvfRnuiIhHmW8CYWQoQcM6Veq/PBu73e9lwSIqPY2DXdgzs2g6AiuoaLv3Lx/y/V5cxLPs0MtPa1Lvsjr0HePKjDXTv0JZ/zN3I1j0HeHTSibRNbF1/3JxzfLC6iCWbd5MYHyAxLkBSQhzdO7Rh4oDMiOzZzVy5gx+++imFpRUApCcn0K19WwZ1a8c3x/X+7+crIv7w7RCZmfUBXvPexgPPOeceNLNbAJxzfzOzrkAe0A4IAmXAYKBzXcs2tM2mHiJrjDU7SrngTx8ypk8nnrpxVL1/IO997VNeXLiZmd+bwMyVO/jFmysYmtWBv1+fS+fUJF9qa04qq4O8vqSAqXM2sGpHaZ3znNS7I7+6bAg5Gam+1LD3QBUPvLGClxdtYUCXNG4c24ud+yrZuns/2/YcYP76neyrrOGswV24fWJfhmV38KUOkZbAz0Nkvp6DiTQ/Awbg6bn5/Oz15dx34WBuGNv7S9Pzi/dx5u8/4KrRPXjgkhMAmL58O3c+v5gu7drwl6tHMCSrvW/1RVNldZBn5m1kyux17NhbwcCuaXzztD5cMKwbzkFFdZDK6iDvfb6DX739OQeqgtw6MYdvT8ghKT6OmqBjV3klhXsr2LyrnE07y9lUUk5xWQWTRvdgfP+GexOvrgnyn88Luf+N5Wzfe4BbxufwnTP7kRT/xb3H3eWVPPVxPk9+lM+e/VWM7JlOdnpbOqYk0Sk1kU4piWR3TKZHx2S6tW9DfJzuR5bYpYBpJL8DxjnHTU8t5KN1O3nj9lMZ0DXtC9PvfH4x767YzuzvTySz3aHDaJ9s2sW3n13EzrJK7ji9H7dOzCEhRv5oOeeYsWIHv/73SjYU7+PkPp24ZUIO4/p1rncvr6i0ggfeXMG0pVvpnJqEGewsqyB42I9i+7YJJMQFKC6r4JoxPfjxeYNITvzyUd3NJeW8lLeZl/O2sH3vAfpkpPDwFcM4sUf6EWsvPVDFs/M2MX35dnbuq6CkrJJ9lTVfmCcuYPTomMz
4/hlcMLQbI3qkE9A5NYkhCphG8jtgIPTH8ZxHZtM2MY4HLx3y32/WK7bu5bxH53DrhBx+cM7ALy23u7ySn72+nGlLtzIsqz0PXzmcvpmHDhE559izv4qi0goKSysoLqvghO7t6zyMVBMM/VHfsqucPhkp9O6cSlZ626MKreKyCuat38lp/TJo3zahCf8TsGp7Kb94Yzkfr9tJTkYKPzl/MBMGZDT6/MqsVYW8vGgL7drE0zk1iYy0JDJSk8hKD+09tE9O4EBVDQ9NX8XfP9pAz47J/P5rw+nZMZnFm3azaNMu8vJLyNu4CwPG98/ga6N6cMagzCYH+IGqGopKK9iyaz+bS8rZWLKPVdtLmb2mmMrqIF3bteG8Id24anQ2/bqkNbxCkWZOAdNIkQgYgEUbS/jeS0vJ31nOWYO78NPzB3PfG8vJyy9hzg9Op31y/X+w31q2jZ/861PKKqpJSYqnusZRVROkqib4pW/wABMHZHDzqX0Y27cTlTVBXvukgMdmr2dD8b4vzBcfMPp1SWPigAzOGNSF4dkd6rx6bX1RGVM/3MCri7ZQUR2kQ3ICt0/syzVjeh7VVVazVxfxrWcWkZQQ4K4z+3P1ST183Subu24n97y8lK179nPwRzY+YAw+rh2nD8zkytxsjuvQ1rftlx6oYubKQt5cto0PVhVRWRPktH6dufnU3ozv3/hQFWluFDCNFKmAgdCVZU98mM+fZq6husZRWRPkB+cM4NYJDd8rU1h6gL/P2cD+qhriAwES4o2EQID0lMT/fovvkJzA9OXbeXbeRorLKhnQJY09+6vYvvcAJ3Rvx60T+nJS747k7yxnQ/E+1heVsWjjLvI27qIm6OiUksjo3h1JTownMd5IjAtQsHs/760sJCEuwFdHdOeswV148qN85qwppnuHtnz3zH5cOOy4BoPmzWVbuevFJfTNTOMfN4064lV14VR6oIqpczbQNjGOET3SGdK9fVSuzivZV8lz8zfy9NyNFJZW0Dczle+c0Y8LhnZT0EiLo4BppEgGzEHb9xzgt++sZF1RGS9MHlPnOYJjcaCqhmlLt/LPeRtJbRPPt8blcNoRzm/sKa9i1upC3vu8kM8K9oROrnt7SEnxAa7Mzea6k3uRkXboiraP1hbzm3+v5NOCPbRNiOOUnE5MGJDBhAGZZKW3/cK2np23kZ++/hm5PdOZev2oJh9eiwWV1UHe+nQrj32wnpXbSzmpd0fuu+h4BnXT5c/ScihgGikaARMrgkHH7DVFzFxZyKxVRWwqKQcgLSmerI7JZKe3JSkhjjeWbuX0gZn85eoRre7envrUBB0vLNzEQ9NXsWd/FdeO6cndZw044qFSkeZCAdNICpjwcM6xoXgfc9YUs76ojM3eCe9tew5w3pCuPHjpkJi5Ci6cdpdX8vsZq3l23kay0pP5+/W5uhBAmj0FTCMpYKQ5WLRxF996ZhEVVTU8evWJTByQGe2SROqlgGkkBYw0FwW79/ONf+Sxavte7j1/MDeN7cXWPQdYXrCH5Vv3squ8kpSkeFKT4klJjKNX5xTG9cvQPTYScQqYRlLASHOyr6Kau15cwrsrdpCWFE9pRTUAZqFzW+WVNVTXujZ9cLd23H1Wf84YFJm+2kRAAdNoChhpboJBx98/3MD64jIGH9eewd3aMahbGsmJ8TjnqKgOsq+imlmrivjje2vYVFLOsOwO3HBKT2qCofM6JfsqqQ46zh/STf2mSdgpYBpJASMtWVVNkFcXbeFPM9dSsHv/f8fHB4yAGZU1QYZ0b8+1Y3py4bDjdBWfhIUCppEUMBILKquDrN5RSlqbeNJTEklLiqesopp/LS7gmXkbWb2jjLQ28Yzvn8G4/hmM65dB1/aRudlVYo8CppEUMBLrnHMszN/FS3mb+WB1EUXes24GdEnjqtHZTBrdQw9Wk6OigGkkBYy0Js45Vm4vZfbqIt5Zvp3Fm3aTmZbEt8bncPXoHjqEJo2igGkkBYy0Vs455q0
v4dH31jB3/U46pybyjdP6cM2YnqQm+fpkdGnhFDCNpIARgYX5oaCZs6aY9m0TuOGUXtw4thcdkhOjXZo0QwqYRlLAiByydPNu/vz+Wmas2EFKYhw/Pn8QXz+pZ7TLkmbGz4DRvrNIjBqW3YHHr8tl5fa9PPjW59z72mckJ8Zx6YlZ0S5NWgn1WCgS4wZ2bcfj1+Uypk9Hvv/yMmatKox2SdJKKGBEWoE2CXE8fl0u/buk8e1nP2Hxpl3RLklaAQWMSCuR1iaBp24aRUZaEjc9tZC1haXRLklinAJGpBXJTGvDMzePJi4QYNKU+SzbsjvaJUkMU8CItDI9O6XwwuQxtEkI8LXH5vHe5zuiXZLEKAWMSCvUNzOV/7v1FPpmpvLNp/P45/yN0S5JYpCvAWNm+Wb2qZktMbMv3aBiZgPNbK6ZVZjZPYdNO8fMVpnZWjP7oZ91irRGmWlteGHyGCYMyOTe1z7j9++uinZJEmMisQcz0Tk3vJ4beUqAO4GHao80szjgL8C5wGDgKjMb7HulIq1MSlI8U64dyddys3l05lqe+mhDtEuSGBLVQ2TOuULn3EKg6rBJo4G1zrn1zrlK4AXg4ogXKNIKxMcF+NVlQzh7cBfuf3MFM1bonIyEh98B44B3zWyRmU0+iuW6A5trvd/ijfsSM5tsZnlmlldUVHQMpYq0XnEB44+TTmRI9/bc8fwnLN2sq8vk2PkdMKc650YQOtR1m5mNC/cGnHNTnHO5zrncjIyMcK9epNVomxjH1OtD98nc/I+FbC4pj3ZJ0sL5GjDOuQLv30LgNUKHvhqjAMiu9T7LGyciPspIS+LJG0ZTWR3k6qnz+GhtcbRLkhbMt4AxsxQzSzv4Gjgb+KyRiy8E+plZbzNLBCYB0/ypVERq65uZypM3hr4Lfn3qfG775yds3b0/ylVJS+Rnb8pdgNfM7OB2nnPOvWNmtwA45/5mZl2BPKAdEDSz7wKDnXN7zex2YDoQBzzhnFvuY60iUsvInunMuGs8j32wnv+dtZaZKwv5zpn9+Na4Pni/0yIN0vNgROSINpeU//fqsutP7sl9Fx2vkIkhfj4PRnfyi8gRZXdMZsq1I/nGqb35x9yN/PKtz4mlL6biHz1wTEQaZGbce/4gqoOOv3+4gfiA8cNzB2pPRo5IASMijWJm/PzCwdQEHY/NXk98nHHP2QMUMlIvBYyINJqZ8YuLjqc66PjL++vIyUjlshF6BLPUTedgROSoBALGLy85gdye6fz89eUU6BJmqYcCRkSOWlzA+P2Vwwk6xz0vLSUY1El/+TIFjIg0SY9OyfzswsHMXb+TJ9QLs9RBASMiTXZlbjZnDsrkf6avYvWO0miXI82MAkZEmszM+PVlQ0lLiue7LyyhsjoY7ZKkGVHAiMgxyUhL4teXDWHFtr08Pmd9tMuRZkQBIyLH7Ozju3LO8V3508w1uqpM/ksBIyJh8dMLQ081f+CNFVGuRJoLBYyIhEX3Dm254/R+vLN8O7NWFUa7HGkGFDAiEjbfOK03vTuncN+05VRU10S7HIkyBYyIhE1SfBz3XXQ8+TvLmTpH98a0dgoYEQmr8f0z/nvCf8uu8miXI1GkgBGRsPvphYMxjF/ohH+rpoARkbDr3qEtd57RjxkrdvCfFTuiXY5EiQJGRHxx86m96ZeZys+nLae8sjra5UgUKGBExBeJ8QF+eckJFOzez6PvrY12ORIFChgR8c1JfTrx1RFZTJ2zXp1htkIKGBHx1Y/PG0hKUjw/+ddnOKfnxrQmChgR8VWn1CR+eO5AFmwo4eVFW6JdjkSQAkZEfPe13GxG9UrngTdXsG2POsNsLXwNGDPLN7NPzWyJmeXVMd3M7FEzW2tmy8xsRK1pNd5yS8xsmp91ioi/AgHjd5cPo7rG8YNXlulQWSsRiT2Yic654c653DqmnQv084bJwF9rTdvvLTfcOXdRBOoUER/16pzCj88byJw1xTy3YFO0y5EIiPYhsouBp13
IPKCDmXWLck0i4pOvn9STU/t25sG3PmfTTnUjE+v8DhgHvGtmi8xsch3TuwOba73f4o0DaGNmeWY2z8wu8blOEYmAQMD47eVDiTPjnpeXEgzqUFks8ztgTnXOjSB0KOw2Mxt3FMv29A6rXQ08YmY5dc1kZpO9IMorKioKQ8ki4qfuHdryswsHsyC/hCc/zo92OeIjXwPGOVfg/VsIvAaMPmyWAiC71vssb1ztZdcDs4AT69nGFOdcrnMuNyMjI6z1i4g/Lh+ZxYQBGTwyYzXFZRXRLkd84lvAmFmKmaUdfA2cDXx22GzTgOu8q8nGAHucc9vMLN3MkrxlOwNjAXXLKhIjzIyfnD+Y/VU1/GHG6miXIz7xcw+mC/ChmS0FFgBvOefeMbNbzOwWb563gfXAWuBx4FZv/CAgz1v2feA3zjkFjEgM6ZuZyjVjevL8gk2s2q5uZGKRxdL16Lm5uS4v70u324hIM7VrXyXjf/c+w7I78PRNozGzaJfU6pjZonpuIzlm0b5MWURasfSURO48ox9z1hQza5Uu0ok1ChgRiarrTu5F784p/PKtFVTVBKNdjoSRAkZEoioxPsCPzh3IuqJ9PK87/GOKAkZEou6swV0Y06cjf565lspq7cXECgWMiESdmXHrhL4UllYwbenWaJcjYaKAEZFm4bR+nRnYNY3HZ69Xb8sxQgEjIs2CmfGN0/qwakcps9cUR7scCQMFjIg0GxcNO47MtCSmzlkf7VIkDBQwItJsJMYHuGFsL+asKWbF1r3RLkeOkQJGRJqVr4/uSXJiHFM/1F5MS6eAEZFmpX1yAlfmZjNtyVa27zkQ7XLkGChgRKTZufnU3gSd4yk9L6ZFU8CISLOT3TGZc07oynPzN3Kgqiba5UgTKWBEpFn6+kk92Xugmnc+2x7tUqSJFDAi0iyd3KcTPTomq3+yFkwBIyLNUiBgfG1UNvM3lLC+qCza5UgTKGBEpNm6YmQWcQHjxbzN0S5FmqBRAWNmOWaW5L2eYGZ3mlkHf0sTkdYus10bzhiYyauLtqiX5RaosXswrwI1ZtYXmAJkA8/5VpWIiGfS6GyKyyp57/Md0S5FjlJjAybonKsGLgX+5Jz7PtDNv7JERELG98+kW/s2PL9Qh8lamsYGTJWZXQVcD7zpjUvwpyQRkUPiAsYVudnMWVPEll3l0S5HjkJjA+ZG4GTgQefcBjPrDTzjX1kiIodcmZsFwEt5W6JciRyNRgWMc26Fc+5O59zzZpYOpDnnfutzbSIiAGSlJzOuXwYv522mJqiHkbUUjb2KbJaZtTOzjsAnwONm9nt/SxMROeSq0dls23OAD1YXRrsUaaTGHiJr75zbC1wGPO2cOwk407+yRES+6IxBXeicmsRz83Wyv6VobMDEm1k34EoOneRvkJnlm9mnZrbEzPLqmG5m9qiZrTWzZWY2ota0681sjTdc39htikhsSogLcEVuFu+vKmTHXnXj3xI0NmDuB6YD65xzC82sD7CmkctOdM4Nd87l1jHtXKCfN0wG/grgHYr7OXASMBr4uXfuR0RasUmjsqkJOl7Wnf0tQmNP8r/snBvqnPu29369c+6rYdj+xYQOuTnn3Dygg7en9BVghnOuxDm3C5gBnBOG7YlIC9azUwpj+3bihYWbCepkf7PX2JP8WWb2mpkVesOrZpbViEUd8K6ZLTKzyXVM7w7U/iqyxRtX33gRaeVu6hrkWy8+TLBdOwgEoF07uPVWWLcu2qXJYRp7iOxJYBpwnDe84Y1ryKnOuRGEDoXdZmbjmlTlEZjZZDPLM7O8oqKicK9eRJqTf/+b0792FpOWTid+Xxk4B6WlMHUqDB0K//53tCuUWhobMBnOuSedc9Xe8BSQ0dBCzrkC799C4DVC51NqKyDUr9lBWd64+sbXtY0pzrlc51xuRkaDJYlIS7VuHVx+OVZeTkLwsKdcVlVBeTlcfrn2ZJqRxgbMTjO7xszivOEaYOeRFjCzFDNLO/gaOBv
47LDZpgHXeVeTjQH2OOe2Ebqg4GwzS/dO7p/tjROR1urhh0NBciRVVfCHP0SmHmlQYwPmJkKXKG8HtgGXAzc0sEwX4EMzWwosAN5yzr1jZreY2S3ePG8D64G1wOPArQDOuRLgAWChN9zvjROR1urZZxsXMM+oF6vmwpxr2pUYZvZd59wjYa7nmOTm5rq8vC/dbiMisSAQCJ1zacx8NTUNzycAmNmiem4jOWbH8kTLu8NWhYhIQ1JTwzuf+O5YAsbCVoWISEOuuQYSGnhKSEICXHttZOqRBh1LwOguJxGJnO99r3EBc9ddkalHGnTEgDGzUjPbW8dQSuh+GBGRyMjJgVdegeTkLwVNVSAel5wcmp6TE6UC5XBHDBjnXJpzrl0dQ5pzLj5SRYqIAHDuubBsGUyeHLqDPxCgMiWV54Z9hVXTPwxNl2bjWA6RiYhEXk4O/PnPsGcP1NSwv6iEX59/G08X6Ttvc6OAEZEWrX3bBM4b0o1pS7ZSXlkd7XKkFgWMiLR4k0b1oKyimreWbYt2KVKLAkZEWrxRvdLp0zmFl/ScmGZFASMiLZ6ZceWobBbm72L1jtJolyMeBYyIxIQrc7NpkxDg8dnro12KeBQwIhITOqYkcmVuNv9aUsC2PfujXY6ggBGRGPLN0/oQdPDkR/nRLkVQwIhIDMnumMz5Q7rx3PxN7NnfQNf+4jsFjIjElMnj+lBWUc0/52+MdimtngJGRGLKCd3bc1q/zjzxYT4HqvRcmGhSwIhIzLllfA7FZRW8trgg2qW0agoYEYk5p+R0Ykj39jw+ez01QT1ZJFoUMCISc8yMW8bnsL54HzNW7Ih2Oa2WAkZEYtI5J3QlK70tT3y0IdqltFoKGBGJSXEB4/qTe7FgQwmfFeyJdjmtkgJGRGLWlaOySU6M042XUaKAEZGY1b5tApePzOKNpVspKq2IdjmtjgJGRGLaDaf0orImqBsvo0ABIyIxrU9GKqcPzOTZeRupqNaNl5Hke8CYWZyZLTazN+uY1tPM3jOzZWY2y8yyak2rMbMl3jDN7zpFJHbdOLYXxWWVvLFUT7yMpEjswXwH+LyeaQ8BTzvnhgL3A7+uNW2/c264N1zkd5EiErtO7duZfpmpPPnRBpzTjZeR4mvAeHsk5wNT65llMDDTe/0+cLGf9YhI62Rm3Di2N8u37mX+hpJol9Nq+L0H8wjwAyBYz/SlwGXe60uBNDPr5L1vY2Z5ZjbPzC7xuU4RiXGXntidjimJPPbBumiX0mr4FjBmdgFQ6JxbdITZ7gHGm9liYDxQABw8C9fTOZcLXA08YmY59WxnshdEeUVFRWFsgYjEkraJcdw0thfvrypi+VbdeBkJfu7BjAUuMrN84AXgdDN7tvYMzrmtzrnLnHMnAvd643Z7/xZ4/64HZgEn1rUR59wU51yucy43IyPDr7aISAy49uRepCbF87+ztBcTCb4FjHPuR865LOdcL2ASMNM5d03tecyss5kdrOFHwBPe+HQzSzo4D6GwWuFXrSLSOrRvm8C1J/fk7U+3sa6oLNrlxLyI3wdjZveb2cGrwiYAq8xsNdAFeNAbPwjIM7OlhE7+/8Y5p4ARkWN286m9SYwL8DftxfjOYumSvdzcXJeXlxftMkSkmbtv2nKenbeRD34wke4d2ka7nKgys0Xe+e6w0538ItLqfHNcHwAen70+ypXENgWMiLQ63Tu05dITu/P8gk0Ul6kTTL8oYESkVbplQg6VNUGeUlf+vlHAiEirlJORyhkDM3lh4Waqauq7F1yOhQJGRFqtq0/qQXFZBTNW7Ih2KTFJASMirdb4/pl079BWz4rxiQJGRFqtuIBx1ehsPlq7kw3F+6JdTsxRwIhIq3ZlbjbxAeP5BZuiXUrMUcCISKuW2a4NZw3uwst5mzlQpSdehpMCRkRava+f1JNd5VW889n2aJcSUxQwItLqnZLTiV6dknluvg6ThZMCRkRavUDAuGp0Dxbkl7B6R2m0y4kZChg
REeDykVkkxgX45zxdshwuChgREaBTahLnD+3Gq58UUHqgKtrlxAQFjIiI54ZTelFWUc0ri7ZEu5SYoIAREfEMy+7AiB4d+MfH+QSDsfOsrGhRwIiI1HLD2N7k7yxn1urCaJfS4ilgRERqOfeErnRpl8ST6sb/mClgRERqSYgLcO2YnsxZU8waXbJ8TBQwIiKHuWp0DxLjAzz1cX60S2nRFDAiIofplJrEJcOP4/8+KWBPuS5ZbioFjIhIHW44pTf7q2p4MU/dxzSVAkZEpA6Dj2vH6N4deXbeJl2y3EQKGBGRekwalc2mknIW5JdEu5QWSQEjIlKPc0/oRmpSPC/n6c7+pvA9YMwszswWm9mbdUzraWbvmdkyM5tlZlm1pl1vZmu84Xq/6xQROVzbxDguHNaNtz/dRllFdbTLaXEisQfzHeDzeqY9BDztnBsK3A/8GsDMOgI/B04CRgM/N7P0CNQqIvIFl4/MZn9VDW8v2xbtUlocXwPG2yM5H5hazyyDgZne6/eBi73XXwFmOOdKnHO7gBnAOX7WKiJSlxE9OtAnI4WX8jZHu5QWx+89mEeAHwDBeqYvBS7zXl8KpJlZJ6A7UPvT3OKNExGJKDPjipHZ5G3cxfqismiX06L4FjBmdgFQ6JxbdITZ7gHGm9liYDxQANQc5XYmm1memeUVFRU1vWARkXp8dUR34gKmbvyPkp97MGOBi8wsH3gBON3Mnq09g3Nuq3PuMufcicC93rjdhIImu9asWd64L3HOTXHO5TrncjMyMnxohoi0dpnt2jC+fwavfrKFGt0T02i+BYxz7kfOuSznXC9gEjDTOXdN7XnMrLOZHazhR8AT3uvpwNlmlu6d3D/bGyciEhVXjMxix94KZq/RkZLGivh9MGZ2v5ld5L2dAKwys9VAF+BBAOdcCfAAsNAb7vfGiYhExRmDupCenMDLOtnfaPGR2IhzbhYwy3v9s1rjXwFeqWeZJzi0RyMiElWJ8QEuH5nFEx/ls7awjL6ZqdEuCYCNO/cRMCO7Y3K0S/kS3ckvItJIt4zPoW1CHA9NXxXtUv7rj/9Zw3mPzqGi+qiuj4oIBYyISCN1Sk1i8rg+vLN8O59s2hXtcthTXsXOzju0AAANSklEQVRbn27j4uHHkRQfF+1yvkQBIyJyFG4+tTedU5P4zdsrcS66V5S9tngLFdVBrhrdI6p11EcBIyJyFFKS4vnOmf1YkF/C+6sKo1aHc47nF2xmaFZ7jj+ufdTqOBIFjIjIUZo0KptenZL57b9XRe2+mE827WbVjtJmu/cCChgRkaOWEBfg+18ZyKodpby2uM57wH33/IJNpCTGceGw46Ky/cZQwIiINMF5Q7oyLKs9v5u+ki27yiO67T37q3hz2VYuGt6d1KSI3G3SJAoYEZEmMDN+eckQyitruPJvcyPaEebrSwo4UBXk6mZ8eAwUMCIiTTYkqz3Pf3MMFdVBrnxsLiu27vV9m845npu/iRO6t2NIVvM8uX+QAkZE5Bic0L09L91yMglxASZNmcuijf72arVk825Wbm/eJ/cPUsCIiByjnIxUXr7lZDqmJHLt3xewtrDUt209M28jbRPiuKgZn9w/SAEjIhIGWenJvPitk2mTEMd3XlhCZXV9z1lsulXbS/nX4gKuGt2DtDYJYV9/uClgRETCpEu7Nvz2q0NZvnUvD88If39lv3r7c1KT4rnj9L5hX7cfFDAiImF01uAuXDW6B1Nmr2fuup1hW+/s1UV8sLqIO07vR3pKYtjW6ycFjIhImP30gkH07pTC3S8tYU951TGvrybo+NXbn5PdsS3XndIzDBVGhgJGRCTMkhPjeWTScIpKK/jJ658dc6eYry7awsrtpfy/cwY2y16T66OAERHxwdCsDnz3zH68sXQrtz+3mJJ9lU1aT3llNQ+9u4oTe3Tg/CHdwlylv5pvHwMiIi3crRP6YmY88p/VzN+wkwcvHcJXju96VOuYMns9haUV/PWaEZiZT5X
6Q3swIiI+CQSM2yb2Zdrtp5KZ1oZvPbOIu19cwu7yxu3NvL+qkD/NXMsFQ7sxsmdHn6sNPwWMiIjPBnVrx79uG8udZ/Tj9aVbOePhD3ht8ZYjnptZtmU3tz77CQO7pvGbrw6NYLXho4AREYmAxPgAd5/VnzduP5Xsjsnc9eJSrvn7/Do7ydy0s5ybnlpIp9REnrxxVLPuMflILNqP/Ayn3Nxcl5eXF+0yRESOKBh0PLdgE799ZyUV1UEmDsjgpN6dOKlPRzLT2nDlY3PZVV7Jq98+hZyMVF9rMbNFzrlcP9bdMmNRRKQFCwSMa8b05Ozju/Doe2v4YHUR05fvCE2z0APNnvvmSb6Hi98UMCIiUZKZ1oZfXjIEgILd+5m/fid5G3dx9uAuLfKk/uEUMCIizUD3Dm25bEQWl43IinYpYeP7SX4zizOzxWb2Zh3TepjZ+970ZWZ2nje+l5ntN7Ml3vA3v+sUEZHwisQezHeAz4F2dUz7CfCSc+6vZjYYeBvo5U1b55wbHoH6RETEB77uwZhZFnA+MLWeWRyHgqc9sNXPekREJHL8PkT2CPADoL4n79wHXGNmWwjtvdxRa1pv79DZB2Z2mr9liohIuPkWMGZ2AVDonFt0hNmuAp5yzmUB5wHPmFkA2Ab0cM6dCNwNPGdmdR1iw8wmm1memeUVFRWFuRUiItJUfu7BjAUuMrN84AXgdDN79rB5bgZeAnDOzQXaAJ2dcxXOuZ3e+EXAOqB/XRtxzk1xzuU653IzMjL8aYmIiBw13wLGOfcj51yWc64XMAmY6Zy75rDZNgFnAJjZIEIBU2RmGWYW543vA/QD1vtVq4iIhF/E74Mxs/uBPOfcNOB7wONmdhehE/43OOecmY0D7jezKkLnb25xzpVEulYREWm6mOqLzMyKgI2HjW4P7GlgXO33Db3uDBQfQ5l11dPYeY62LYe/P/g6ltpS+/WxtOdY2lLfNP2cHRqnz6ZxtTY0jx+fzQDnXFrDZTeBcy6mB2BKQ+Nqv2/oNaG9r7DW09h5jrYtR2hDzLQlXO05lrbo5+zIP2f6bGL3s2loaA3d9b/RiHFvHOXrcNfT2HmOti2Hv3+jnnmaqjm0pbF1NORY2lLfNP2chYc+myOPj+Znc0QxdYgsEswsz/nUtXWkxVJbILbaE0ttgdhqTyy1BfxtT2vYgwm3KdEuIIxiqS0QW+2JpbZAbLUnltoCPrZHezAiIuIL7cGIiIgvWnXAmNkTZlZoZp81YdmRZvapma01s0fNzGpNu8PMVprZcjP7n/BWXW89YW+Lmd1nZgW1HptwXvgrr7cmXz4bb/r3zMyZWefwVXzEevz4bB7wHnGxxMzeNbPjwl95nfX40Zbfeb8vy8zsNTPrEP7K663Jj/Zc4f3uB83M93M1x9KGetZ3vZmt8Ybra40/4u9Vnfy6PK0lDMA4YATwWROWXQCMAQz4N3CuN34i8B8gyXuf2YLbch9wT6x8Nt60bGA6ofulOrfUtgDtas1zJ/C3FtyWs4F47/Vvgd+25J8zYBAwAJgF5DbXNnj19TpsXEdCvaZ0BNK91+lHau+Rhla9B+Ocmw18oYcAM8sxs3fMbJGZzTGzgYcvZ2bdCP2Cz3Oh//mngUu8yd8GfuOcq/C2UehvK0J8akvU+NiePxDq4TtiJx/9aItzbm+tWVOIUHt8asu7zrlqb9Z5QMQe6ehTez53zq2KRP3e9prUhnp8BZjhnCtxzu0CZgDnNPXvRKsOmHpMAe5wzo0E7gH+t455ugNbar3f4o2DUKecp5nZfAs9amCUr9Ue2bG2BeB279DFE2aW7l+pjXJM7TGzi4EC59xSvwtthGP+bMzsQTPbDHwd+JmPtTYkHD9nB91E6NtxNIWzPdHSmDbUpTuwudb7g+1qUnsj3hdZc2ZmqcApwMu1Di8mHeVq4gntXo4BRgEvmVkfL/UjJkxt+SvwAKFvxw8ADxP6AxBxx9oeM0sGfkzocExUhemzwTl3L3C
vmf0IuB34ediKbKRwtcVb171ANfDP8FTXpBrC1p5oOVIbzOxGQk8ZBugLvG1mlcAG59yl4a5FAfNFAWC3O+xRzRbq2fngc22mEfrDW3s3Pgso8F5vAf7PC5QFZhYk1HdRpB9Wc8xtcc7tqLXc48CbfhbcgGNtTw7QG1jq/dJlAZ+Y2Wjn3Hafaz9cOH7OavsnoQf2RTxgCFNbzOwG4ALgjEh/GTtMuD+baKizDQDOuSeBJwHMbBahDobza81SAEyo9T6L0LmaAprSXr9PQDX3AehFrZNjwMfAFd5rA4bVs9zhJ7zO88bfAtzvve5PaHfTWmhbutWa5y7ghZb82Rw2Tz4ROsnv02fTr9Y8dwCvtOC2nAOsADIi+fPl988ZETrJ39Q2UP9J/g2ETvCne687Nqa9ddYVjQ+0uQzA84SenllFaM/jZkLfct8Blno/9D+rZ9lc4DNCD0P7M4duWk0EnvWmfQKc3oLb8gzwKbCM0Le2bpFoi1/tOWyefCJ3FZkfn82r3vhlhPqV6t6C27KW0BexJd4QkSvifGzPpd66KoAdwPTm2AbqCBhv/E3eZ7IWuLGh9h5p0J38IiLiC11FJiIivlDAiIiILxQwIiLiCwWMiIj4QgEjIiK+UMBITDOzsghvb6qZDQ7Tumos1FvyZ2b2RkO9DJtZBzO7NRzbFgkHXaYsMc3MypxzqWFcX7w71DGjr2rXbmb/AFY75x48wvy9gDedcydEoj6RhmgPRlodM8sws1fNbKE3jPXGjzazuWa22Mw+NrMB3vgbzGyamc0E3jOzCWY2y8xesdBzTP558NkY3vhc73WZ1yHlUjObZ2ZdvPE53vtPzeyXjdzLmsuhTjtTzew9M/vEW8fF3jy/AXK8vZ7fefN+32vjMjP7RRj/G0UapICR1uiPwB+cc6OArwJTvfErgdOccycS6p34V7WWGQFc7pwb770/EfguMBjoA4ytYzspwDzn3DBgNvDNWtv/o3NuCF/sobZOXj9YZxDqTQHgAHCpc24EoecPPewF3A+Bdc654c6575vZ2UA/YDQwHBhpZuMa2p5IuKizS2mNzgQG1+pptp3XA2174B9m1o9QD9IJtZaZ4Zyr/cyNBc65LQBmtoRQX1AfHradSg51ELoIOMt7fTKHnqXxHPBQPXW29dbdHfic0LM5INQX1K+8sAh607vUsfzZ3rDYe59KKHBm17M9kbBSwEhrFADGOOcO1B5pZn8G3nfOXeqdz5hVa/K+w9ZRUet1DXX/LlW5Qyc565vnSPY754Z7jxqYDtwGPEro+S8ZwEjnXJWZ5QNt6ljegF875x47yu2KhIUOkUlr9C6hHogBMLOD3Zq351AX5Df4uP15hA7NAUxqaGbnXDmhxyJ/z8ziCdVZ6IXLRKCnN2spkFZr0enATd7eGWbW3cwyw9QGkQYpYCTWJZvZllrD3YT+WOd6J75XEHrEAsD/AL82s8X4u3f/XeBuM1tG6KFPexpawDm3mFDPyVcRev5Lrpl9ClxH6NwRzrmdwEfeZc2/c869S+gQ3Fxv3lf4YgCJ+EqXKYtEmHfIa79zzpnZJOAq59zFDS0n0tLoHIxI5I0E/uxd+bWbKD2GWsRv2oMRERFf6ByMiIj4QgEjIiK+UMCIiIgvFDAiIuILBYyIiPhCASMiIr74/4N5RqOLf9z7AAAAAElFTkSuQmCC\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot(skip_end=15)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 44:34

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
13.4969303.3678480.390874
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.fit_one_cycle(1, 2.75e-2, moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fit_head')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('fit_head');" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To complete the fine-tuning, we can then unfreeze and launch a new training." + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [], + "source": [ + "learn.unfreeze()" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Min numerical gradient: 6.92E-06\n" + ] + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "

" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot(skip_end=15, skip_start=15)" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [], + "source": [ + "from fastai.callbacks import SaveModelCallback\n", + "cb = SaveModelCallback(learn, every='epoch')" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 4:10:59

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
13.1862403.1533180.415778
23.0674323.0458290.429288
33.0239722.9902760.436462
42.9555882.9595680.440429
52.8965132.9535000.441327
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "IOPub message rate exceeded.\n", + "The notebook server will temporarily stop sending output\n", + "to the client in order to avoid crashing it.\n", + "To change this limit, set the config variable\n", + "`--NotebookApp.iopub_msg_rate_limit`.\n", + "\n", + "Current values:\n", + "NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)\n", + "NotebookApp.rate_limit_window=3.0 (secs)\n", + "\n" + ] + } + ], + "source": [ + "learn.fit_one_cycle(5, 1e-3, moms=(0.8,0.7), callbacks=[cb])" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fine_tuned')" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Min numerical gradient: 1.32E-04\n" + ] + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "

" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot(skip_end=15, skip_start=15)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "How good is our model? Well let's try to see what it predicts after a few given words." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('fine_tuned');" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [], + "source": [ + "cb = SaveModelCallback(learn, every='epoch', name='bestmodel_finetune_stage2')" + ] + }, + { + "cell_type": "code", + "execution_count": 24, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 4:10:56

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
12.9082932.9531300.441311
22.9085092.9499500.441765
32.8926252.9471430.442238
42.8778562.9456620.442433
52.8901442.9454290.442483
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "IOPub message rate exceeded.\n", + "The notebook server will temporarily stop sending output\n", + "to the client in order to avoid crashing it.\n", + "To change this limit, set the config variable\n", + "`--NotebookApp.iopub_msg_rate_limit`.\n", + "\n", + "Current values:\n", + "NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)\n", + "NotebookApp.rate_limit_window=3.0 (secs)\n", + "\n", + "IOPub message rate exceeded.\n", + "The notebook server will temporarily stop sending output\n", + "to the client in order to avoid crashing it.\n", + "To change this limit, set the config variable\n", + "`--NotebookApp.iopub_msg_rate_limit`.\n", + "\n", + "Current values:\n", + "NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)\n", + "NotebookApp.rate_limit_window=3.0 (secs)\n", + "\n", + "IOPub message rate exceeded.\n", + "The notebook server will temporarily stop sending output\n", + "to the client in order to avoid crashing it.\n", + "To change this limit, set the config variable\n", + "`--NotebookApp.iopub_msg_rate_limit`.\n", + "\n", + "Current values:\n", + "NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)\n", + "NotebookApp.rate_limit_window=3.0 (secs)\n", + "\n" + ] + } + ], + "source": [ + "learn.fit_one_cycle(5, 1e-4, moms=(0.8,0.7), callbacks=[cb])" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "metadata": {}, + "outputs": [], + "source": [ + "TEXT = \"Wat een fantastisch boek\"\n", + "N_WORDS = 40\n", + "N_SENTENCES = 2" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Wat een fantastisch boek , met een goed verhaal . Een boek waar je in je hoofd mee wilt puzzelen en dan is het ook nog eens spannend . 
Je krijgt een goed beeld van wat er er allemaal gebeuren is met\n", + "Wat een fantastisch boek ! Door de prachtige cover die Jef beschrijft en de prachtige kleuren , die je in zijn greep houdt , is het een boek dat je niet snel zal vergeten . \n", + " We gaan Wil van\n" + ] + } + ], + "source": [ + "print(\"\\n\".join(learn.predict(TEXT, N_WORDS, temperature=0.75) for _ in range(N_SENTENCES)))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We have to save the model but also its encoder, the part that's responsible for creating and updating the hidden state. For the next part, we don't care about the part that tries to guess the next word." + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save_encoder('fine_tuned_enc')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Classifier" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now, we'll create a new data object that only grabs the labelled data and keeps those labels. Again, this line takes a bit of time."
+ ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [], + "source": [ + "bs=32\n", + "fname = 'tmp_clas_bs{}'.format(bs)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "data_clas = (TextList.from_folder(path, vocab=data_lm.vocab)\n", + " #grab all the text files in path\n", + " .split_by_folder(valid='test')\n", + " #split by train and valid folder (that only keeps 'train' and 'test' so no need to filter)\n", + " .label_from_folder(classes=['neg', 'pos'])\n", + " #label them all with their folders\n", + " .databunch(bs=bs))\n", + "\n", + "data_clas.save(fname)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "scrolled": false + }, + "outputs": [], + "source": [ + "data_clas = load_data(path, fname, bs=bs)" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
texttarget
xxbos “ xxmaj het huwelijk is het graf van de liefde . ” \\n \\n xxmaj woorden , woorden , woorden . xxmaj in de juiste volgorde vormen ze een universum waarin je helemaal wil verdwijnen . xxmaj alleen al bij het horen van de naam xxmaj proust word ik – heel toepasselijk - teruggeworpen naar die heerlijke weken waarin ik mocht verdwalen in de omgeving van xxmaj xxunkneg
xxbos xxmaj van alle genres die ik lees , ben ik het meest kritisch voor fantasy . xxmaj als fantasy goed is , is hij vaak ook heel goed , maar als een fantasyboek niet echt goed is , wordt het snel kinderachtig . xxmaj nogal wat auteurs ( en lezers ) zijn al tevreden als de obligate tovenaars , draken en magische zwaarden aanwezig zijn . xxmaj het verhaalneg
xxbos xxmaj het is zo treurig dat in het tijdperk waarin iedereen ( in de vrije wereld althans ) uitstekend xxunk is om de juistheid of xxunk van elke stelling , elke bewering zelf na te gaan , vrijwel niemand de moeite neemt om het te doen . xxmaj het kritisch vermogen ontbreekt kennelijk volkomen . xxmaj een paar xxunk en je duikt in gedigitaliseerde archieven , bekijkt ebook versiesneg
xxbos xxmaj de jonge filosoof xxmaj ype de xxmaj boer ( 1989 ) , die gepromoveerd is op de postmoderne xxmaj italiaanse filosoof xxmaj xxunk , heeft onlangs een boekje gepubliceerd waarin hij xxmaj murakami 's fictie interpreteert vanuit filosofische invalshoek . xxmaj wat zijn de kernthema 's van xxmaj murakami 's fictie , zo vraagt xxmaj de xxmaj boer zich af , en wat voor waardevolle filosofische conclusies kunnenpos
xxbos xxmaj pierre xxmaj lauffer ( 1920 - 1981 ) schreef vrijwel zijn hele leven poëzie en proza . xxmaj frank xxmaj martinus xxmaj arion noemde hem de xxmaj dante van het xxmaj papiaments . ‘ xxmaj je kunt zeggen dat iedereen die in het xxmaj papiaments goede poëzie schrijft , op de ene of andere manier door xxmaj pierre beïnvloed is.’ xxmaj helaas was het juist de taal diepos
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "data_clas.show_batch()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can then create a model to classify those reviews and load the encoder we saved before." + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "learn = text_classifier_learner(data_clas, AWD_LSTM, drop_mult=0.5)\n", + "learn.load_encoder('fine_tuned_enc')" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n" + ] + } + ], + "source": [ + "learn.lr_find()" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Min numerical gradient: 2.29E-02\n" + ] + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "

" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.recorder.plot()" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 02:24

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.4587310.3202280.860554
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.fit_one_cycle(1, 1e-3, moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('first')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('first');" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 03:03

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.3044650.2143480.915950
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.freeze_to(-2)\n", + "learn.fit_one_cycle(1, slice(1e-2/(2.6**4),1e-2), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('second')" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('second');" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "LR Finder is complete, type {learner_name}.recorder.plot() to see the graph.\n", + "Min numerical gradient: 3.31E-06\n" + ] + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "

" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "learn.lr_find()\n", + "learn.recorder.plot(skip_end=15, skip_start=15)" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 05:07

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.2789790.1956040.922159
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.freeze_to(-3)\n", + "learn.fit_one_cycle(1, slice(5e-5/(2.6**4),5e-3), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('third')" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "learn.load('third');" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 18:25

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.2688360.1915260.927889
20.2384360.1763440.931710
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.unfreeze()\n", + "learn.fit_one_cycle(2, slice(1e-3/(2.6**4),1e-3), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fourth')" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Total time: 44:24

\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epochtrain_lossvalid_lossaccuracy
10.2863340.1880370.926457
20.2676890.1768390.930277
30.2610100.1714480.934097
40.2243150.1712470.934575
50.2273270.1636050.938395
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Model seems not to overfit yet! Try again with more epochs\n", + "learn.load('third');\n", + "learn.unfreeze()\n", + "learn.fit_one_cycle(5, slice(1e-3/(2.6**4),1e-3), moms=(0.8,0.7))" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "learn.save('fifth')" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
texttargetprediction
xxbos xxmaj grieks drama in de xxunk \\n \\n \\n xxmaj xxunk : spoilers \\n \\n \\n ‘ xxmaj de volle maan , tragisch die avond , was reeds vroeg , nog in de laatste xxunk xxunk als een immense , xxunk bol , xxunk als een zonsondergang laag achter de xxunk van de xxmaj lange xxmaj laan en steeg , langzaam zich louterende van haar tragische tintpospos
xxbos xxmaj for xxunk : xxmaj below \\n \\n xxmaj deon xxmaj meyer is een van mijn favoriete schrijvers . xxmaj op 9 juni zou xxmaj deon zijn boeken signeren in een boekhandel van xxunk , slechts 35 km van mijn dorpje . xxmaj nou ben ik niet iemand , die snel contact maakt met allerlei schrijvers , maar als het zo dichtbij is , kon ik dit nietpospos
xxbos xxmaj giorgio xxmaj bassani ( 1916 - 2000 ) heeft tot 1981 een groot deel van leven doorgebracht in een xxmaj joodse gemeenschap in het xxmaj noord - xxmaj italiaanse stadje xxmaj ferrara aan de rivier de xxmaj po . xxmaj hij wordt gezien als een van de belangrijkste moderne schrijvers van xxmaj italië . \\n \\n xxmaj de kronieken van xxmaj ferrara ( xxmaj il xxmaj xxunkpospos
xxbos xxmaj ondanks zijn grote succes als dichter en een boekenplank vol publicaties vecht xxmaj rogi xxmaj wieg ( 1962 ) al jarenlang tegen zijn depressies . xxmaj misschien heeft het een met het ander te maken . xxmaj iemand die zo diep durft te gaan in wat hij schrijft , iemand die pijnlijk eerlijk over zichzelf durft te zijn , zoals in xxmaj kameraad xxmaj scheermes , zet zichzelfpospos
xxbos xxmaj maar de kerel staat erop . “ xxmaj in dit land , ” verklaart hij , “ moet je , als je iets wilt hebben , dwang xxunk \\n \\n ( … ) \\n \\n ‘ “ xxmaj er zitten twee mensen in een kamer , ” begin ik . “ xxmaj ineens wordt er aan de deur xxunk \\n \\n xxmaj bij dit eerstepospos
xxbos xxmaj hoewel dit boek de xxmaj man xxmaj booker prijs 2014 gewonnen heeft zijn de meningen verdeeld : sommigen vinden het een meesterwerk , terwijl bijvoorbeeld de xxmaj new xxmaj york xxmaj times sprak van een \" deeply xxunk novel \" . xxmaj zelf baalde ik als een stekker dat dit boek won terwijl prachtboeken van andere giganten ( xxmaj mitchell , xxmaj powers , xxmaj amis ) nietpospos
xxbos xxmaj achterflap : \\n xxmaj ruim zeventig jaar nadat een xxmaj duitse xxunk zijn geheime “ xxmaj wunderwaffen ” van de brandstapel wist te redden , vindt er in het grensgebied van xxmaj soedan een mysterieuze explosie plaats , waardoor de bevolking van een compleet dorp van de aardbodem verdwijnt . xxmaj als het bericht van de slachting xxmaj europa bereikt , wordt xxmaj alex xxmaj de xxmajpospos
xxbos xxmaj het leven is hardlopen , onder andere xxrep 5 . \\n \\n \\n \\n ‘ xxmaj ik hou er niet van om te veel over mezelf te vertellen , maar als ik anderzijds niet eerlijk vertel wat er te vertellen valt , heeft het schrijven van een boek als dit niet veel zin en had ik me net zo goed de moeite kunnen besparen [ xxrep 4posneg
xxbos xxmaj toen ik de voorpublicatie van dit boek van xxmaj giphart gelezen had , was ik direct gegrepen en ben ik zeer enthousiast geworden om mee te doen aan de xxmaj hebban - leesclub . xxmaj ik moet eerlijk zeggen - en ik heb dat ook eerlijk gezegd in mijn motivatie voor de leesclub - dat ik maar één boek van xxmaj giphart gelezen heb : xxmaj troost uitnegneg
xxbos ‘ xxmaj villa xxmaj toscane – xxmaj linda xxmaj van xxmaj xxunk – xxmaj een trage start met een voorspelbaar einde . \\n \\n “ xxmaj villa xxmaj toscane ” , een titel waarmee je als lezer meteen in vakantiestemming terechtkomt , maar al snel blijkt het toch niet de beste bestemming te zijn en al zeker niet met het verleden van xxmaj carlo en zijn ex -negneg
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.show_results(rows=10)" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [], + "source": [ + "interp = learn.interpret()" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "

" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "interp.plot_confusion_matrix()" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(tensor([9.5704, 7.3124, 5.9622, 5.8540, 5.8231, 4.8916, 4.7085, 3.7781, 3.5620,\n", + " 3.4087]),\n", + " tensor([2060, 2032, 1402, 1002, 1813, 1274, 418, 380, 178, 1853]))" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "interp.top_losses(k=10)" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(Text xxbos xxmaj met haar debuut xxmaj muidhond heeft xxmaj inge xxmaj schilperoord een gevoelig onderwerp in de literatuur aangesneden . \n", + " \n", + " xxmaj muidhond gaat over xxmaj jonathan ( 30 ) die na vrijspraak bij gebrek aan bewijs terugkeert naar huis . xxmaj hij woont samen met zijn moeder in een vissersdorpje en werkt in een xxunk . xxmaj hij heeft zijn hond xxmaj milk gemist en is blij dat hij weer met zijn hond door de duinen kan wandelen . xxmaj daar vind hij in een klein meertje een muidhond die hij mee naar huis neemt om voor te zorgen . xxmaj hij wordt rustig van het kijken naar de vis in zijn aquarium . \n", + " \n", + " xxmaj jonathan is een pedofiel die na zijn vrijspraak probeert om een ‘ nieuw mens’ te worden . xxmaj hij stelt een strak xxunk op en verplicht zichzelf aan opdrachten te werken die hij van zijn psycholoog heeft meegekregen . xxmaj dan leert hij een nieuw buurmeisje ( xxmaj elke ) kennen en wordt zijn voornemen zwaar op de proef gesteld . xxmaj om deze worsteling met zijn geaardheid draait het boek . xxmaj het stelt de vraag in hoeverre iemand wezenlijk in staat is om te veranderen . xxmaj en ook welke rol de omgeving speelt . xxmaj in hoeverre is iemand volledig toerekeningsvatbaar ? 
\n", + " \n", + " xxmaj het knappe van de schrijfster is dat ze de neergang van xxmaj jonathan heel geleidelijk beschrijft . xxmaj hierin zijn duidelijke overeenkomsten met ‘ xxmaj de xxunk , van xxmaj albert xxmaj camus te herkennen ( zie ook het motto in het boek ) \n", + " xxmaj de hoofdpersoon xxmaj meursault is net als xxmaj jonathan een in zichzelf gekeerde , zonderlinge man . xxmaj ook hij streeft een xxunk bestaan dat vrij is van veranderingen na . xxmaj hij heeft weinig ambitie en ervaart het leven als een opeenvolging van tragische gebeurtenissen die hun loop nemen , zonder dat je hier als mens controle over hebt . xxmaj ook de hitte speelt daarbij een grote rol . \n", + " xxmaj de neergang wordt zo als het ware onontkoombaar . \n", + " \n", + " xxmaj een belangrijk verschil is echter dat xxmaj inge xxmaj schilperoord zonder de ernst van de situatie te bagatelliseren , ze xxmaj jonathan met veel inlevingsvermogen beschrijft . xxmaj dat leidt er toe dat je hem als mens kunt zien die zowel dader als slachtoffer is . \n", + " ' xxmaj wat beweegt de jonge zwarte deelpachter xxmaj tucker xxmaj caliban om huis , vee en akkers te vernietigen en met vrouw en kind naar het xxmaj noorden te vertrekken?'- xxmaj win xxmaj uit de maat voor je hele leesgroep ! \n", + " ' xxmaj het is autobiografisch , helemaal waargebeurd maar toch zie je elementen van fictie in de stijl en vooral de opbouw , dat maakt het des te sterker . ' - xxmaj win boeken voor je hele leesclub ! \n", + " xxmaj we gaan xxmaj wil van xxmaj jeroen xxmaj olyslaegers luisteren via de gratis xxmaj hebban xxmaj luisterboeken - app . 
xxmaj doe je mee ?,\n", + " Category pos)" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "learn.data.valid_ds[2060]" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [], + "source": [ + "y_probs, y_pred, y_loss = learn.get_preds(ordered=True, with_loss=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(tensor([0.0586, 0.9414]), tensor(1), tensor(9.5704))" + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "y_probs[2060], y_pred[2060], y_loss[2060]" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.1" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +}